fixed snoop forwarding bug and single bank support
This commit is contained in:
@@ -15,8 +15,8 @@ DBG_PRINT_FLAGS = -DDBG_PRINT_CORE_ICACHE \
|
||||
#DBG_PRINT=$(DBG_PRINT_FLAGS)
|
||||
|
||||
#MULTICORE += -DNUM_CLUSTERS=2 -DNUM_CORES=4
|
||||
MULTICORE += -DNUM_CLUSTERS=1 -DNUM_CORES=4
|
||||
#MULTICORE += -DNUM_CLUSTERS=1 -DNUM_CORES=2
|
||||
#MULTICORE += -DNUM_CLUSTERS=1 -DNUM_CORES=4
|
||||
MULTICORE += -DNUM_CLUSTERS=1 -DNUM_CORES=2
|
||||
|
||||
#DEBUG = 1
|
||||
|
||||
|
||||
File diff suppressed because it is too large
Load Diff
@@ -158,7 +158,7 @@
|
||||
|
||||
// Number of banks {1, 2, 4, 8,...}
|
||||
`ifndef INUM_BANKS
|
||||
`define INUM_BANKS 8
|
||||
`define INUM_BANKS 1
|
||||
`endif
|
||||
|
||||
// Size of a word in bytes
|
||||
|
||||
32
hw/rtl/cache/VX_bank.v
vendored
32
hw/rtl/cache/VX_bank.v
vendored
@@ -714,17 +714,31 @@ module VX_bank #(
|
||||
|| dram_fill_req_stall;
|
||||
|
||||
`ifdef DBG_PRINT_CACHE_BANK
|
||||
always_ff @(posedge clk) begin
|
||||
if (dram_fill_req_valid && dram_fill_req_ready) begin
|
||||
$display("%t: bank%02d:%01d dram_fill req: addr=%0h", $time, CACHE_ID, BANK_ID, `LINE_TO_BYTE_ADDR(dram_fill_req_addr, BANK_ID));
|
||||
if (NUM_BANKS == 1) begin
|
||||
always_ff @(posedge clk) begin
|
||||
if (dram_fill_req_valid && dram_fill_req_ready) begin
|
||||
$display("%t: bank%02d:%01d dram_fill req: addr=%0h", $time, CACHE_ID, BANK_ID, dram_fill_req_addr);
|
||||
end
|
||||
if (dram_wb_req_valid && dram_wb_req_ready) begin
|
||||
$display("%t: bank%02d:%01d dram_wb req: addr=%0h, data=%0h", $time, CACHE_ID, BANK_ID, dram_wb_req_addr, dram_wb_req_data);
|
||||
end
|
||||
if (dram_fill_rsp_valid && dram_fill_rsp_ready) begin
|
||||
$display("%t: bank%02d:%01d dram_fill rsp: addr=%0h, data=%0h", $time, CACHE_ID, BANK_ID, dram_fill_rsp_addr, dram_fill_rsp_data);
|
||||
end
|
||||
end
|
||||
if (dram_wb_req_valid && dram_wb_req_ready) begin
|
||||
$display("%t: bank%02d:%01d dram_wb req: addr=%0h, data=%0h", $time, CACHE_ID, BANK_ID, `LINE_TO_BYTE_ADDR(dram_wb_req_addr, BANK_ID), dram_wb_req_data);
|
||||
end else begin
|
||||
always_ff @(posedge clk) begin
|
||||
if (dram_fill_req_valid && dram_fill_req_ready) begin
|
||||
$display("%t: bank%02d:%01d dram_fill req: addr=%0h", $time, CACHE_ID, BANK_ID, `LINE_TO_BYTE_ADDR(dram_fill_req_addr, BANK_ID));
|
||||
end
|
||||
if (dram_wb_req_valid && dram_wb_req_ready) begin
|
||||
$display("%t: bank%02d:%01d dram_wb req: addr=%0h, data=%0h", $time, CACHE_ID, BANK_ID, `LINE_TO_BYTE_ADDR(dram_wb_req_addr, BANK_ID), dram_wb_req_data);
|
||||
end
|
||||
if (dram_fill_rsp_valid && dram_fill_rsp_ready) begin
|
||||
$display("%t: bank%02d:%01d dram_fill rsp: addr=%0h, data=%0h", $time, CACHE_ID, BANK_ID, `LINE_TO_BYTE_ADDR(dram_fill_rsp_addr, BANK_ID), dram_fill_rsp_data);
|
||||
end
|
||||
end
|
||||
if (dram_fill_rsp_valid && dram_fill_rsp_ready) begin
|
||||
$display("%t: bank%02d:%01d dram_fill rsp: addr=%0h, data=%0h", $time, CACHE_ID, BANK_ID, `LINE_TO_BYTE_ADDR(dram_fill_rsp_addr, BANK_ID), dram_fill_rsp_data);
|
||||
end
|
||||
end
|
||||
end
|
||||
`endif
|
||||
|
||||
endmodule : VX_bank
|
||||
40
hw/rtl/cache/VX_cache.v
vendored
40
hw/rtl/cache/VX_cache.v
vendored
@@ -287,25 +287,43 @@ module VX_cache #(
|
||||
assign per_bank_core_rsp_data [i] = curr_bank_core_rsp_data;
|
||||
|
||||
// Dram fill request
|
||||
assign per_bank_dram_fill_req_valid[i] = curr_bank_dram_fill_req_valid;
|
||||
assign per_bank_dram_fill_req_addr[i] = `LINE_TO_DRAM_ADDR(curr_bank_dram_fill_req_addr, i);
|
||||
assign curr_bank_dram_fill_req_ready = dram_fill_req_ready;
|
||||
assign per_bank_dram_fill_req_valid[i] = curr_bank_dram_fill_req_valid;
|
||||
if (NUM_BANKS == 1) begin
|
||||
assign per_bank_dram_fill_req_addr[i] = curr_bank_dram_fill_req_addr;
|
||||
end else begin
|
||||
assign per_bank_dram_fill_req_addr[i] = `LINE_TO_DRAM_ADDR(curr_bank_dram_fill_req_addr, i);
|
||||
end
|
||||
assign curr_bank_dram_fill_req_ready = dram_fill_req_ready;
|
||||
|
||||
// Dram fill response
|
||||
assign curr_bank_dram_fill_rsp_valid = dram_rsp_valid && (`DRAM_ADDR_BANK(dram_rsp_tag) == i);
|
||||
assign curr_bank_dram_fill_rsp_addr = `DRAM_TO_LINE_ADDR(dram_rsp_tag);
|
||||
if (NUM_BANKS == 1) begin
|
||||
assign curr_bank_dram_fill_rsp_valid = dram_rsp_valid;
|
||||
assign curr_bank_dram_fill_rsp_addr = dram_rsp_tag;
|
||||
end else begin
|
||||
assign curr_bank_dram_fill_rsp_valid = dram_rsp_valid && (`DRAM_ADDR_BANK(dram_rsp_tag) == i);
|
||||
assign curr_bank_dram_fill_rsp_addr = `DRAM_TO_LINE_ADDR(dram_rsp_tag);
|
||||
end
|
||||
assign curr_bank_dram_fill_rsp_data = dram_rsp_data;
|
||||
assign per_bank_dram_fill_rsp_ready[i] = curr_bank_dram_fill_rsp_ready;
|
||||
|
||||
// Dram writeback request
|
||||
assign per_bank_dram_wb_req_valid[i] = curr_bank_dram_wb_req_valid;
|
||||
assign per_bank_dram_wb_req_addr[i] = `LINE_TO_DRAM_ADDR(curr_bank_dram_wb_req_addr, i);
|
||||
assign per_bank_dram_wb_req_data[i] = curr_bank_dram_wb_req_data;
|
||||
assign curr_bank_dram_wb_req_ready = per_bank_dram_wb_req_ready[i];
|
||||
assign per_bank_dram_wb_req_valid[i] = curr_bank_dram_wb_req_valid;
|
||||
if (NUM_BANKS == 1) begin
|
||||
assign per_bank_dram_wb_req_addr[i] = curr_bank_dram_wb_req_addr;
|
||||
end else begin
|
||||
assign per_bank_dram_wb_req_addr[i] = `LINE_TO_DRAM_ADDR(curr_bank_dram_wb_req_addr, i);
|
||||
end
|
||||
assign per_bank_dram_wb_req_data[i] = curr_bank_dram_wb_req_data;
|
||||
assign curr_bank_dram_wb_req_ready = per_bank_dram_wb_req_ready[i];
|
||||
|
||||
// Snoop request
|
||||
assign curr_bank_snp_req_valid = snp_req_valid_qual && (`DRAM_ADDR_BANK(snp_req_addr_qual) == i);
|
||||
assign curr_bank_snp_req_addr = `DRAM_TO_LINE_ADDR(snp_req_addr_qual);
|
||||
if (NUM_BANKS == 1) begin
|
||||
assign curr_bank_snp_req_valid = snp_req_valid_qual;
|
||||
assign curr_bank_snp_req_addr = snp_req_addr_qual;
|
||||
end else begin
|
||||
assign curr_bank_snp_req_valid = snp_req_valid_qual && (`DRAM_ADDR_BANK(snp_req_addr_qual) == i);
|
||||
assign curr_bank_snp_req_addr = `DRAM_TO_LINE_ADDR(snp_req_addr_qual);
|
||||
end
|
||||
assign curr_bank_snp_req_tag = snp_req_tag_qual;
|
||||
assign per_bank_snp_req_ready[i] = curr_bank_snp_req_ready;
|
||||
|
||||
|
||||
20
hw/rtl/cache/VX_cache_core_req_bank_sel.v
vendored
20
hw/rtl/cache/VX_cache_core_req_bank_sel.v
vendored
@@ -12,18 +12,24 @@ module VX_cache_core_req_bank_sel #(
|
||||
parameter NUM_REQUESTS = 0
|
||||
) (
|
||||
input wire [NUM_REQUESTS-1:0] core_req_valid,
|
||||
`IGNORE_WARNINGS_BEGIN
|
||||
input wire [NUM_REQUESTS-1:0][31:0] core_req_addr,
|
||||
`IGNORE_WARNINGS_END
|
||||
output reg [NUM_BANKS-1:0][NUM_REQUESTS-1:0] per_bank_valids
|
||||
);
|
||||
integer i;
|
||||
|
||||
always @(*) begin
|
||||
per_bank_valids = 0;
|
||||
for (i = 0; i < NUM_REQUESTS; i++) begin
|
||||
if (NUM_BANKS == 1) begin
|
||||
// If there is only one bank, then only map requests to that bank
|
||||
|
||||
if (NUM_BANKS == 1) begin
|
||||
always @(*) begin
|
||||
per_bank_valids = 0;
|
||||
for (i = 0; i < NUM_REQUESTS; i++) begin
|
||||
per_bank_valids[0][i] = core_req_valid[i];
|
||||
end else begin
|
||||
end
|
||||
end
|
||||
end else begin
|
||||
always @(*) begin
|
||||
per_bank_valids = 0;
|
||||
for (i = 0; i < NUM_REQUESTS; i++) begin
|
||||
per_bank_valids[core_req_addr[i][`BANK_SELECT_ADDR_RNG]][i] = core_req_valid[i];
|
||||
end
|
||||
end
|
||||
|
||||
41
hw/rtl/cache/VX_cache_miss_resrv.v
vendored
41
hw/rtl/cache/VX_cache_miss_resrv.v
vendored
@@ -156,18 +156,35 @@ module VX_cache_miss_resrv #(
|
||||
|
||||
`ifdef DBG_PRINT_CACHE_MSRQ
|
||||
integer j;
|
||||
always_ff @(posedge clk) begin
|
||||
if (mrvq_push || mrvq_pop) begin
|
||||
$write("%t: bank%02d:%01d msrq: push=%b pop=%b", $time, CACHE_ID, BANK_ID, mrvq_push, mrvq_pop);
|
||||
for (j = 0; j < MRVQ_SIZE; j++) begin
|
||||
if (valid_table[j]) begin
|
||||
$write(" ");
|
||||
if (schedule_ptr == $bits(schedule_ptr)'(j)) $write("*");
|
||||
if (~ready_table[j]) $write("!");
|
||||
$write("addr%0d=%0h", j, `LINE_TO_BYTE_ADDR(addr_table[j], BANK_ID));
|
||||
end
|
||||
end
|
||||
$write("\n");
|
||||
if (NUM_BANKS == 1) begin
|
||||
always_ff @(posedge clk) begin
|
||||
if (mrvq_push || mrvq_pop) begin
|
||||
$write("%t: bank%02d:%01d msrq: push=%b pop=%b", $time, CACHE_ID, BANK_ID, mrvq_push, mrvq_pop);
|
||||
for (j = 0; j < MRVQ_SIZE; j++) begin
|
||||
if (valid_table[j]) begin
|
||||
$write(" ");
|
||||
if (schedule_ptr == $bits(schedule_ptr)'(j)) $write("*");
|
||||
if (~ready_table[j]) $write("!");
|
||||
$write("addr%0d=%0h", j, {addr_table[j], `BASE_ADDR_BITS'(0)});
|
||||
end
|
||||
end
|
||||
$write("\n");
|
||||
end
|
||||
end
|
||||
end else begin
|
||||
always_ff @(posedge clk) begin
|
||||
if (mrvq_push || mrvq_pop) begin
|
||||
$write("%t: bank%02d:%01d msrq: push=%b pop=%b", $time, CACHE_ID, BANK_ID, mrvq_push, mrvq_pop);
|
||||
for (j = 0; j < MRVQ_SIZE; j++) begin
|
||||
if (valid_table[j]) begin
|
||||
$write(" ");
|
||||
if (schedule_ptr == $bits(schedule_ptr)'(j)) $write("*");
|
||||
if (~ready_table[j]) $write("!");
|
||||
$write("addr%0d=%0h", j, `LINE_TO_BYTE_ADDR(addr_table[j], BANK_ID));
|
||||
end
|
||||
end
|
||||
$write("\n");
|
||||
end
|
||||
end
|
||||
end
|
||||
`endif
|
||||
|
||||
40
hw/rtl/cache/VX_snp_forwarder.v
vendored
40
hw/rtl/cache/VX_snp_forwarder.v
vendored
@@ -34,11 +34,13 @@ module VX_snp_forwarder #(
|
||||
output wire [NUM_REQUESTS-1:0] snp_fwdin_ready
|
||||
);
|
||||
reg [`DRAM_ADDR_WIDTH+SNP_REQ_TAG_WIDTH-1:0] pending_reqs [SNRQ_SIZE-1:0];
|
||||
reg [`REQS_BITS-1:0] pending_cntrs [SNRQ_SIZE-1:0];
|
||||
reg [`LOG2UP(SNRQ_SIZE)-1:0] rd_ptr, wr_ptr;
|
||||
reg [`LOG2UP(SNRQ_SIZE)-1:0] pending_size;
|
||||
reg [`REQS_BITS:0] pending_cntrs [SNRQ_SIZE-1:0];
|
||||
reg [`LOG2UP(SNRQ_SIZE):0] rd_ptr, wr_ptr;
|
||||
reg [`REQS_BITS-1:0] fwdin_sel;
|
||||
wire enqueue, dequeue, empty;
|
||||
|
||||
wire [`LOG2UP(SNRQ_SIZE)-1:0] rd_a, wr_a;
|
||||
|
||||
wire enqueue, dequeue, empty, full;
|
||||
|
||||
wire fwdout_ready;
|
||||
|
||||
@@ -49,47 +51,43 @@ module VX_snp_forwarder #(
|
||||
|
||||
assign fwdout_ready = (& snp_fwdout_ready);
|
||||
|
||||
assign snp_req_ready = (pending_size != `LOG2UP(SNRQ_SIZE)'(SNRQ_SIZE-1)) // not full
|
||||
&& fwdout_ready;
|
||||
assign snp_req_ready = !full && fwdout_ready;
|
||||
|
||||
assign rd_a = rd_ptr[`LOG2UP(SNRQ_SIZE)-1:0];
|
||||
assign wr_a = wr_ptr[`LOG2UP(SNRQ_SIZE)-1:0];
|
||||
|
||||
genvar i;
|
||||
|
||||
for (i = 0; i < NUM_REQUESTS; i++) begin
|
||||
assign snp_fwdout_valid[i] = enqueue && fwdout_ready;
|
||||
assign snp_fwdout_addr[i] = snp_req_addr;
|
||||
assign snp_fwdout_tag[i] = wr_ptr;
|
||||
assign snp_fwdout_tag[i] = wr_a;
|
||||
end
|
||||
|
||||
assign fwdin_ready = snp_rsp_ready;
|
||||
|
||||
assign fwdin_taken = fwdin_valid && fwdin_ready;
|
||||
|
||||
assign snp_rsp_valid = fwdin_taken && (1 == pending_cntrs[fwdin_tag]); // send response
|
||||
assign {snp_rsp_addr, snp_rsp_tag} = pending_reqs[fwdin_tag];
|
||||
|
||||
assign empty = (wr_ptr == rd_ptr);
|
||||
assign full = (wr_a == rd_a) && (wr_ptr[`LOG2UP(SNRQ_SIZE)] != rd_ptr[`LOG2UP(SNRQ_SIZE)]);
|
||||
|
||||
assign enqueue = snp_req_valid && snp_req_ready;
|
||||
assign dequeue = !empty && (0 == pending_cntrs[rd_ptr]);
|
||||
assign dequeue = !empty && (0 == pending_cntrs[rd_a]);
|
||||
|
||||
always @(posedge clk) begin
|
||||
if (reset) begin
|
||||
rd_ptr <= 0;
|
||||
wr_ptr <= 0;
|
||||
pending_size <= 0;
|
||||
rd_ptr <= 0;
|
||||
wr_ptr <= 0;
|
||||
end else begin
|
||||
if (enqueue) begin
|
||||
pending_reqs[wr_ptr] <= {snp_req_addr, snp_req_tag};
|
||||
pending_cntrs[wr_ptr] <= `REQS_BITS'(NUM_REQUESTS);
|
||||
wr_ptr <= wr_ptr + 1;
|
||||
if (!dequeue) begin
|
||||
pending_size <= pending_size + 1;
|
||||
end
|
||||
pending_reqs[wr_a] <= {snp_req_addr, snp_req_tag};
|
||||
pending_cntrs[wr_a] <= NUM_REQUESTS;
|
||||
wr_ptr <= wr_ptr + 1;
|
||||
end
|
||||
if (dequeue) begin
|
||||
rd_ptr <= rd_ptr + 1;
|
||||
if (!enqueue) begin
|
||||
pending_size <= pending_size - 1;
|
||||
end
|
||||
end
|
||||
if (fwdin_taken) begin
|
||||
pending_cntrs[fwdin_tag] <= pending_cntrs[fwdin_tag] - 1;
|
||||
|
||||
@@ -190,6 +190,10 @@ void Simulator::flush_caches(uint32_t mem_addr, uint32_t size) {
|
||||
|
||||
int pending_snp_reqs = 1;
|
||||
|
||||
#ifdef DBG_PRINT_CACHE_SNP
|
||||
std::cout << timestamp << ": [sim] snp req: addr=" << std::hex << vortex_->snp_req_addr << std::dec << " tag=" << vortex_->snp_req_tag << " remain=" << (aligned_addr_end - vortex_->snp_req_addr - 1) << std::endl;
|
||||
#endif
|
||||
|
||||
for (;;) {
|
||||
this->step();
|
||||
if (vortex_->snp_rsp_valid) {
|
||||
@@ -200,12 +204,12 @@ void Simulator::flush_caches(uint32_t mem_addr, uint32_t size) {
|
||||
#endif
|
||||
}
|
||||
if (vortex_->snp_req_valid && vortex_->snp_req_ready) {
|
||||
if (vortex_->snp_req_addr < aligned_addr_end) {
|
||||
if (vortex_->snp_req_addr + 1 < aligned_addr_end) {
|
||||
vortex_->snp_req_addr += 1;
|
||||
vortex_->snp_req_tag += 1;
|
||||
++pending_snp_reqs;
|
||||
#ifdef DBG_PRINT_CACHE_SNP
|
||||
std::cout << timestamp << ": [sim] snp req: addr=" << vortex_->snp_req_addr << " tag=" << vortex_->snp_req_tag << " remain=" << (aligned_addr_end - vortex_->snp_req_addr) << std::endl;
|
||||
std::cout << timestamp << ": [sim] snp req: addr=" << std::hex << vortex_->snp_req_addr << std::dec << " tag=" << vortex_->snp_req_tag << " remain=" << (aligned_addr_end - vortex_->snp_req_addr - 1) << std::endl;
|
||||
#endif
|
||||
} else {
|
||||
vortex_->snp_req_valid = 0;
|
||||
|
||||
Reference in New Issue
Block a user