diff --git a/hw/rtl/VX_scheduler.v b/hw/rtl/VX_scheduler.v index 1d9f3149..8b3df579 100644 --- a/hw/rtl/VX_scheduler.v +++ b/hw/rtl/VX_scheduler.v @@ -16,29 +16,29 @@ module VX_scheduler #( output wire schedule_delay, output wire is_empty ); - localparam CTVW = `CLOG2(`NUM_WARPS * 32 + 1); + localparam CTVW = `CLOG2(`NUM_WARPS * `NUM_REGS + 1); - reg [31:0][`NUM_THREADS-1:0] rename_table[`NUM_WARPS-1:0]; + reg [`NUM_REGS-1:0][`NUM_THREADS-1:0] rename_table [`NUM_WARPS-1:0]; + reg [`NUM_REGS-1:0] busy_table[`NUM_WARPS-1:0]; reg [CTVW-1:0] count_valid; - wire rs1_rename = (rename_table[decode_if.warp_num][decode_if.rs1] != 0); - wire rs2_rename = (rename_table[decode_if.warp_num][decode_if.rs2] != 0); - wire rd_rename = (rename_table[decode_if.warp_num][decode_if.rd ] != 0); + wire rs1_rename = busy_table[decode_if.warp_num][decode_if.rs1]; + wire rs2_rename = busy_table[decode_if.warp_num][decode_if.rs2]; + wire rd_rename = busy_table[decode_if.warp_num][decode_if.rd]; wire rs1_rename_qual = (rs1_rename) && (decode_if.use_rs1); wire rs2_rename_qual = (rs2_rename) && (decode_if.use_rs2); wire rd_rename_qual = (rd_rename) && (decode_if.wb != 0); - wire rename_valid = (| decode_if.valid) && (rs1_rename_qual || rs2_rename_qual || rd_rename_qual); + wire rename_valid = (rs1_rename_qual || rs2_rename_qual || rd_rename_qual); - wire ex_stalled = (| decode_if.valid) - && ((alu_busy && (decode_if.ex_type == `EX_ALU)) + wire ex_stalled = ((alu_busy && (decode_if.ex_type == `EX_ALU)) || (lsu_busy && (decode_if.ex_type == `EX_LSU)) || (csr_busy && (decode_if.ex_type == `EX_CSR)) || (mul_busy && (decode_if.ex_type == `EX_MUL)) || (gpu_busy && (decode_if.ex_type == `EX_GPU))); - wire stall = ex_stalled || rename_valid; + wire stall = (ex_stalled || rename_valid) && (| decode_if.valid); wire acquire_rd = (| decode_if.valid) && (decode_if.wb != 0) && ~stall; @@ -49,23 +49,25 @@ module VX_scheduler #( reg [CTVW-1:0] count_valid_next = (acquire_rd && !(release_rd && (0 == valid_wb_new_mask))) ? (count_valid + 1) : (~acquire_rd && (release_rd && (0 == valid_wb_new_mask))) ? (count_valid - 1) : count_valid; - integer i, w; - - always @(posedge clk) begin + always @(posedge clk) begin if (reset) begin + integer i, w; for (w = 0; w < `NUM_WARPS; w++) begin for (i = 0; i < 32; i++) begin rename_table[w][i] <= 0; + busy_table[w][i] <= 0; end - end - count_valid <= 0; + end + count_valid <= 0; end else begin if (acquire_rd) begin rename_table[decode_if.warp_num][decode_if.rd] <= decode_if.valid; + busy_table[decode_if.warp_num][decode_if.rd] <= 1; end if (release_rd) begin assert(rename_table[writeback_if.warp_num][writeback_if.rd] != 0); rename_table[writeback_if.warp_num][writeback_if.rd] <= valid_wb_new_mask; + busy_table[writeback_if.warp_num][writeback_if.rd] <= (| valid_wb_new_mask); end count_valid <= count_valid_next; end