New Warp Scheduler + VCD Enable
This commit is contained in:
198
rtl/VX_fetch.v
198
rtl/VX_fetch.v
@@ -3,7 +3,6 @@
|
||||
|
||||
module VX_fetch (
|
||||
input wire clk,
|
||||
input wire reset,
|
||||
input wire in_memory_delay,
|
||||
input wire in_branch_stall,
|
||||
input wire in_fwd_stall,
|
||||
@@ -21,169 +20,68 @@ module VX_fetch (
|
||||
VX_warp_ctl_inter VX_warp_ctl
|
||||
);
|
||||
|
||||
wire in_change_mask = VX_warp_ctl.change_mask;
|
||||
wire in_wspawn = VX_warp_ctl.wspawn;
|
||||
wire[31:0] in_wspawn_pc = VX_warp_ctl.wspawn_pc;
|
||||
wire in_ebreak = VX_warp_ctl.ebreak;
|
||||
wire[`NW_M1:0] in_decode_warp_num = VX_warp_ctl.warp_num;
|
||||
|
||||
|
||||
// Inputs
|
||||
wire in_freeze = out_delay || in_memory_delay;
|
||||
|
||||
|
||||
// wire in_thread_mask[`NT_M1:0];
|
||||
|
||||
// genvar ind;
|
||||
// for (ind = 0; ind <= `NT_M1; ind = ind + 1) assign in_thread_mask[ind] = VX_warp_ctl.thread_mask[ind];
|
||||
// Locals
|
||||
wire pipe_stall;
|
||||
wire warp_stall;
|
||||
|
||||
|
||||
assign pipe_stall = in_gpr_stall || in_fwd_stall || in_freeze;
|
||||
|
||||
reg stall;
|
||||
reg[31:0] out_PC;
|
||||
assign warp_stall = in_branch_stall || (in_branch_stall_exe && 0);
|
||||
|
||||
reg[`NW_M1:0] warp_num;
|
||||
reg[`NW_M1:0] warp_state;
|
||||
reg[`NW_M1:0] warp_count;
|
||||
wire[`NT_M1:0] thread_mask;
|
||||
wire[`NW_M1:0] warp_num;
|
||||
wire[31:0] warp_pc;
|
||||
VX_warp_scheduler warp_scheduler(
|
||||
.clk (clk),
|
||||
.stall (pipe_stall),
|
||||
// Wspawn
|
||||
.wspawn (VX_warp_ctl.wspawn),
|
||||
.wsapwn_pc (VX_warp_ctl.wspawn_pc),
|
||||
// CTM
|
||||
.ctm (VX_warp_ctl.change_mask),
|
||||
.ctm_mask (VX_warp_ctl.thread_mask),
|
||||
.ctm_warp_num (VX_warp_ctl.warp_num),
|
||||
// WHALT
|
||||
.whalt (VX_warp_ctl.ebreak),
|
||||
.whalt_warp_num (VX_warp_ctl.warp_num),
|
||||
// Wstall
|
||||
.wstall (warp_stall),
|
||||
.wstall_warp_num(VX_warp_ctl.warp_num),
|
||||
|
||||
// reg[31:0] num_ecalls;
|
||||
// JAL
|
||||
.jal (VX_jal_rsp.jal),
|
||||
.jal_dest (VX_jal_rsp.jal_dest),
|
||||
.jal_warp_num (VX_jal_rsp.jal_warp_num),
|
||||
|
||||
initial begin
|
||||
warp_num = 0;
|
||||
warp_state = 0;
|
||||
// num_ecalls = 0;
|
||||
warp_count = 1;
|
||||
end
|
||||
|
||||
|
||||
// always @(posedge clk) begin
|
||||
// if (in_ebreak) begin
|
||||
// num_ecalls <= num_ecalls + 1;
|
||||
// $display("--------> New num_ecalls = %h", num_ecalls+1);
|
||||
// end
|
||||
// end
|
||||
|
||||
wire add_warp = in_wspawn && !in_ebreak && !in_gpr_stall;
|
||||
wire remove_warp = in_ebreak && !in_wspawn && !in_gpr_stall;
|
||||
|
||||
wire[`NW_M1:0] new_warp_state;
|
||||
wire[`NW_M1:0] new_warp_count;
|
||||
|
||||
assign new_warp_count = add_warp ? (warp_count + 1) : ((remove_warp ) ? (warp_count - 1) : (warp_count ));
|
||||
assign new_warp_state = add_warp ? (warp_state + 1) : ((remove_warp && (warp_count == 3)) ? (0 ) : ( warp_state ));
|
||||
|
||||
wire[`NW_M1:0] new_warp_num ;
|
||||
|
||||
assign new_warp_num = (reset || (warp_num >= warp_state) || remove_warp || add_warp) ? 0 : (warp_num + 1);
|
||||
|
||||
always @(posedge clk or posedge reset) begin
|
||||
warp_num <= new_warp_num;
|
||||
warp_state <= new_warp_state;
|
||||
warp_count <= new_warp_count;
|
||||
end
|
||||
|
||||
// always @(posedge clk or posedge reset) begin
|
||||
// if (reset || (warp_num >= warp_state) || remove_warp || add_warp) begin
|
||||
// warp_num <= 0;
|
||||
// end else begin
|
||||
// warp_num <= warp_num + 1;
|
||||
// end
|
||||
|
||||
// if (add_warp) begin
|
||||
// warp_state <= warp_state + 1;
|
||||
// warp_count <= warp_count + 1;
|
||||
// // $display("Adding a new warp %h", warp_state+1);
|
||||
// end else if (remove_warp) begin // No removing, just invalidating
|
||||
// warp_count <= warp_count - 1;
|
||||
// if (warp_count == 2) begin
|
||||
// warp_state <= 0;
|
||||
// end
|
||||
// end
|
||||
// end
|
||||
|
||||
assign out_ebreak = (in_decode_warp_num == 0) && in_ebreak;
|
||||
|
||||
|
||||
assign stall = in_gpr_stall || in_branch_stall || in_fwd_stall || in_branch_stall_exe || in_freeze;
|
||||
|
||||
assign out_which_wspawn = (warp_state+1);
|
||||
|
||||
`ifdef ONLY
|
||||
|
||||
`else
|
||||
|
||||
wire[`NW-1:0][31:0] warp_glob_pc;
|
||||
wire[`NW-1:0][`NT_M1:0] warp_glob_valid;
|
||||
genvar cur_warp;
|
||||
// Instantiates one VX_warp per warp index (0 .. `NW-1). Each instance gets
// control signals qualified by a comparison against its own index cur_warp,
// and drives its slot of warp_glob_pc / warp_glob_valid.
generate
|
||||
for (cur_warp = 0; cur_warp < `NW; cur_warp = cur_warp + 1)
|
||||
begin
|
||||
// Thread-mask change applies only when the decode-stage warp number is this warp.
wire warp_zero_change_mask = in_change_mask && (in_decode_warp_num == cur_warp);
|
||||
// JAL response targeted at this warp.
wire warp_zero_jal = VX_jal_rsp.jal && (VX_jal_rsp.jal_warp_num == cur_warp);
|
||||
// Branch response (branch_dir asserted) targeted at this warp.
wire warp_zero_branch = VX_branch_rsp.branch_dir && (VX_branch_rsp.branch_warp_num == cur_warp);
|
||||
// This warp is stalled on a global stall or whenever it is not the warp selected by warp_num.
wire warp_zero_stall = stall || (warp_num != cur_warp);
|
||||
// Warp 0 never receives a wspawn; any other warp does when its index equals warp_state+1.
wire warp_zero_wspawn = (cur_warp == 0) ? 0 : (in_wspawn && ((warp_state+1) == cur_warp));
|
||||
// The spawn PC is passed through unchanged to every instance.
wire[31:0] warp_zero_wspawn_pc = in_wspawn_pc;
|
||||
// Removal applies only when the decode-stage warp number is this warp.
wire warp_zero_remove = remove_warp && (in_decode_warp_num == cur_warp);
|
||||
|
||||
// NOTE(review): VX_warp is defined elsewhere; port semantics below are taken from the port names only.
VX_warp VX_Warp(
|
||||
.clk (clk),
|
||||
.reset (reset),
|
||||
.stall (warp_zero_stall),
|
||||
.remove (warp_zero_remove),
|
||||
.in_thread_mask(VX_warp_ctl.thread_mask),
|
||||
.in_change_mask(warp_zero_change_mask),
|
||||
.in_jal (warp_zero_jal),
|
||||
.in_jal_dest (VX_jal_rsp.jal_dest),
|
||||
.in_branch_dir (warp_zero_branch),
|
||||
.in_branch_dest(VX_branch_rsp.branch_dest),
|
||||
.in_wspawn (warp_zero_wspawn),
|
||||
.in_wspawn_pc (warp_zero_wspawn_pc),
|
||||
.out_PC (warp_glob_pc[cur_warp]),
|
||||
.out_valid (warp_glob_valid[cur_warp])
|
||||
);
|
||||
end
|
||||
endgenerate
|
||||
|
||||
|
||||
|
||||
reg[31:0] out_PC_var;
|
||||
reg[`NT_M1:0] out_valid_var;
|
||||
|
||||
// Combinational selector: copies the PC and per-thread valid bits of the warp
// whose index equals warp_num into out_PC_var / out_valid_var.
// NOTE(review): nothing is assigned before the loop, so if warp_num matches no
// g in [0, `NW) the outputs are not driven on that evaluation (a latch would
// be inferred) — confirm that every encodable warp_num is below `NW.
always @(*) begin : help
|
||||
// g iterates over warp indices.
integer g;
|
||||
// h iterates over thread indices within a warp.
integer h;
|
||||
for (g = 0; g < `NW; g = g + 1)
|
||||
begin
|
||||
// g is sliced to the width of warp_num before the comparison.
if (warp_num == g[`NW_M1:0])
|
||||
begin
|
||||
out_PC_var = warp_glob_pc[g][31:0];
|
||||
// Copy the valid bits one thread at a time.
for (h = 0; h < `NT; h = h + 1) out_valid_var[h] = warp_glob_valid[g][h];
|
||||
end
|
||||
|
||||
end
|
||||
end
|
||||
|
||||
assign out_PC = out_PC_var;
|
||||
|
||||
`endif
|
||||
// Branch
|
||||
.branch_valid (VX_branch_rsp.valid_branch),
|
||||
.branch_dir (VX_branch_rsp.branch_dir),
|
||||
.branch_dest (VX_branch_rsp.branch_dest),
|
||||
.branch_warp_num(VX_branch_rsp.branch_warp_num),
|
||||
|
||||
// Outputs
|
||||
.thread_mask (thread_mask),
|
||||
.warp_num (warp_num),
|
||||
.warp_pc (warp_pc),
|
||||
.out_ebreak (out_ebreak)
|
||||
);
|
||||
|
||||
|
||||
assign out_delay = 0;
|
||||
assign out_which_wspawn = 0;
|
||||
|
||||
assign icache_request.pc_address = out_PC;
|
||||
assign icache_request.pc_address = warp_pc;
|
||||
assign fe_inst_meta_fd.warp_num = warp_num;
|
||||
assign fe_inst_meta_fd.valid = thread_mask;
|
||||
|
||||
assign out_delay = 0;
|
||||
// assign fe_inst_meta_fd.instruction = (pipe_stall || warp_stall) ? 32'b0 : icache_response.instruction;;
|
||||
// Forward the icache response as the fetched instruction, except when
// thread_mask is all zeros, in which case a zero instruction word is driven.
// The zero constant is written with an explicit base (32'b0): a sized literal
// without a base specifier is not a valid Verilog number.
assign fe_inst_meta_fd.instruction = (thread_mask == 0) ? 32'b0 : icache_response.instruction;
|
||||
assign fe_inst_meta_fd.inst_pc = warp_pc;
|
||||
|
||||
assign fe_inst_meta_fd.warp_num = warp_num;
|
||||
|
||||
genvar index;
|
||||
for (index = 0; index <= `NT_M1; index = index + 1) assign fe_inst_meta_fd.valid[index] = out_valid_var[index];
|
||||
|
||||
assign fe_inst_meta_fd.instruction = (stall) ? 32'b0 : icache_response.instruction;;
|
||||
assign fe_inst_meta_fd.inst_pc = out_PC;
|
||||
|
||||
// always @(*) begin
|
||||
// $display("fetch: icache_request: %x", out_PC);
|
||||
// end
|
||||
|
||||
endmodule
|
||||
Reference in New Issue
Block a user