`include "VX_cache_config.vh" module VX_bank #( parameter CACHE_ID = 0, parameter BANK_ID = 0, // Size of cache in bytes parameter CACHE_SIZE = 1, // Size of line inside a bank in bytes parameter BANK_LINE_SIZE = 1, // Number of bankS parameter NUM_BANKS = 1, // Size of a word in bytes parameter WORD_SIZE = 1, // Number of Word requests per cycle parameter NUM_REQUESTS = 1, // Core Request Queue Size parameter CREQ_SIZE = 1, // Miss Reserv Queue Knob parameter MRVQ_SIZE = 1, // DRAM Response Queue Size parameter DRFQ_SIZE = 1, // Snoop Req Queue Size parameter SNRQ_SIZE = 1, // Core Writeback Queue Size parameter CWBQ_SIZE = 1, // DRAM Request Queue Size parameter DREQ_SIZE = 1, // Snoop Response Size parameter SNPQ_SIZE = 1, // Enable cache writeable parameter WRITE_ENABLE = 0, // Enable dram update parameter DRAM_ENABLE = 0, // Enable cache flush parameter FLUSH_ENABLE = 0, // core request tag size parameter CORE_TAG_WIDTH = 1, // size of tag id in core request tag parameter CORE_TAG_ID_BITS = 0, // Snooping request tag width parameter SNP_REQ_TAG_WIDTH = 1 ) ( `SCOPE_IO_VX_bank input wire clk, input wire reset, // Core Request input wire [NUM_REQUESTS-1:0] core_req_valid, input wire [`CORE_REQ_TAG_COUNT-1:0] core_req_rw, input wire [NUM_REQUESTS-1:0][WORD_SIZE-1:0] core_req_byteen, input wire [NUM_REQUESTS-1:0][`WORD_ADDR_WIDTH-1:0] core_req_addr, input wire [NUM_REQUESTS-1:0][`WORD_WIDTH-1:0] core_req_data, input wire [`CORE_REQ_TAG_COUNT-1:0][CORE_TAG_WIDTH-1:0] core_req_tag, output wire core_req_ready, // Core Response output wire core_rsp_valid, output wire [`REQS_BITS-1:0] core_rsp_tid, output wire [`WORD_WIDTH-1:0] core_rsp_data, output wire [CORE_TAG_WIDTH-1:0] core_rsp_tag, input wire core_rsp_ready, // DRAM request output wire dram_req_valid, output wire dram_req_rw, output wire [BANK_LINE_SIZE-1:0] dram_req_byteen, output wire [`LINE_ADDR_WIDTH-1:0] dram_req_addr, output wire [`BANK_LINE_WIDTH-1:0] dram_req_data, input wire dram_req_ready, // DRAM response input wire dram_rsp_valid, input wire [`LINE_ADDR_WIDTH-1:0] dram_rsp_addr, input wire [`BANK_LINE_WIDTH-1:0] dram_rsp_data, output wire dram_rsp_ready, // Snoop Request input wire snp_req_valid, input wire [`LINE_ADDR_WIDTH-1:0] snp_req_addr, input wire snp_req_invalidate, input wire [SNP_REQ_TAG_WIDTH-1:0] snp_req_tag, output wire snp_req_ready, // Snoop Response output wire snp_rsp_valid, output wire [SNP_REQ_TAG_WIDTH-1:0] snp_rsp_tag, input wire snp_rsp_ready ); `ifdef DBG_CORE_REQ_INFO /* verilator lint_off UNUSED */ wire[31:0] debug_pc_st0; wire[`NR_BITS-1:0] debug_rd_st0; wire[`NW_BITS-1:0] debug_wid_st0; wire debug_rw_st0; wire[WORD_SIZE-1:0] debug_byteen_st0; wire[`REQS_BITS-1:0] debug_tid_st0; wire[`UP(CORE_TAG_ID_BITS)-1:0] debug_tagid_st0; wire[31:0] debug_pc_st1; wire[`NR_BITS-1:0] debug_rd_st1; wire[`NW_BITS-1:0] debug_wid_st1; wire debug_rw_st1; wire[WORD_SIZE-1:0] debug_byteen_st1; wire[`REQS_BITS-1:0] debug_tid_st1; wire[`UP(CORE_TAG_ID_BITS)-1:0] debug_tagid_st1; wire[31:0] debug_pc_st2; wire[`NR_BITS-1:0] debug_rd_st2; wire[`NW_BITS-1:0] debug_wid_st2; wire debug_rw_st2; wire[WORD_SIZE-1:0] debug_byteen_st2; wire[`REQS_BITS-1:0] debug_tid_st2; wire[`UP(CORE_TAG_ID_BITS)-1:0] debug_tagid_st2; wire[31:0] debug_pc_st3; wire[`NR_BITS-1:0] debug_rd_st3; wire[`NW_BITS-1:0] debug_wid_st3; wire debug_rw_st3; wire[WORD_SIZE-1:0] debug_byteen_st3; wire[`REQS_BITS-1:0] debug_tid_st3; wire[`UP(CORE_TAG_ID_BITS)-1:0] debug_tagid_st3; /* verilator lint_on UNUSED */ `endif wire snrq_pop; wire snrq_empty; wire snrq_full; wire [`LINE_ADDR_WIDTH-1:0] snrq_addr_st0; wire snrq_invalidate_st0; wire [SNP_REQ_TAG_WIDTH-1:0] snrq_tag_st0; wire snp_req_fire = snp_req_valid && snp_req_ready; assign snp_req_ready = !snrq_full; VX_generic_queue #( .DATAW(`LINE_ADDR_WIDTH + 1 + SNP_REQ_TAG_WIDTH), .SIZE(SNRQ_SIZE) ) snp_req_queue ( .clk (clk), .reset (reset), .push (snp_req_fire), .pop (snrq_pop), .data_in ({snp_req_addr, snp_req_invalidate, snp_req_tag}), .data_out({snrq_addr_st0, snrq_invalidate_st0, snrq_tag_st0}), .empty (snrq_empty), .full (snrq_full), `UNUSED_PIN (size) ); wire dfpq_pop; wire dfpq_empty; wire dfpq_full; wire [`LINE_ADDR_WIDTH-1:0] dfpq_addr_st0; wire [`BANK_LINE_WIDTH-1:0] dfpq_filldata_st0; assign dram_rsp_ready = !dfpq_full; if (DRAM_ENABLE) begin wire dram_rsp_fire = dram_rsp_valid && dram_rsp_ready; VX_generic_queue #( .DATAW(`LINE_ADDR_WIDTH + $bits(dram_rsp_data)), .SIZE(DRFQ_SIZE) ) dfp_queue ( .clk (clk), .reset (reset), .push (dram_rsp_fire), .pop (dfpq_pop), .data_in ({dram_rsp_addr, dram_rsp_data}), .data_out({dfpq_addr_st0, dfpq_filldata_st0}), .empty (dfpq_empty), .full (dfpq_full), `UNUSED_PIN (size) ); end else begin `UNUSED_VAR (dram_rsp_valid) `UNUSED_VAR (dram_rsp_addr) `UNUSED_VAR (dram_rsp_data) assign dfpq_empty = 1; assign dfpq_full = 0; assign dfpq_addr_st0 = 0; assign dfpq_filldata_st0 = 0; end wire reqq_pop; wire reqq_empty; wire reqq_full; wire [`REQS_BITS-1:0] reqq_req_tid_st0; wire reqq_req_rw_st0; wire [WORD_SIZE-1:0] reqq_req_byteen_st0; `IGNORE_WARNINGS_BEGIN wire [`WORD_ADDR_WIDTH-1:0] reqq_req_addr_st0; `IGNORE_WARNINGS_END wire [`WORD_WIDTH-1:0] reqq_req_writeword_st0; wire [CORE_TAG_WIDTH-1:0] reqq_req_tag_st0; wire core_req_fire = (| core_req_valid) && core_req_ready; assign core_req_ready = !reqq_full; VX_bank_core_req_arb #( .WORD_SIZE (WORD_SIZE), .NUM_REQUESTS (NUM_REQUESTS), .CREQ_SIZE (CREQ_SIZE), .CORE_TAG_WIDTH (CORE_TAG_WIDTH), .CORE_TAG_ID_BITS (CORE_TAG_ID_BITS) ) core_req_arb ( .clk (clk), .reset (reset), // Enqueue .reqq_push (core_req_fire), .bank_valids (core_req_valid), .bank_rw (core_req_rw), .bank_byteen (core_req_byteen), .bank_addr (core_req_addr), .bank_writedata (core_req_data), .bank_tag (core_req_tag), // Dequeue .reqq_pop (reqq_pop), .reqq_req_tid_st0 (reqq_req_tid_st0), .reqq_req_rw_st0 (reqq_req_rw_st0), .reqq_req_byteen_st0 (reqq_req_byteen_st0), .reqq_req_addr_st0 (reqq_req_addr_st0), .reqq_req_writedata_st0(reqq_req_writeword_st0), .reqq_req_tag_st0 (reqq_req_tag_st0), .reqq_empty (reqq_empty), .reqq_full (reqq_full) ); wire msrq_pop; wire msrq_full; wire msrq_almfull; wire msrq_valid_st0; wire[`REQS_BITS-1:0] msrq_tid_st0; wire [`LINE_ADDR_WIDTH-1:0] msrq_addr_st0; wire [`UP(`WORD_SELECT_WIDTH)-1:0] msrq_wsel_st0; wire [`WORD_WIDTH-1:0] msrq_writeword_st0; wire [`REQ_TAG_WIDTH-1:0] msrq_tag_st0; wire msrq_rw_st0; wire [WORD_SIZE-1:0] msrq_byteen_st0; wire msrq_is_snp_st0; wire msrq_snp_invalidate_st0; wire msrq_pending_hazard_st1; wire is_msrq_miss_st2; wire is_msrq_miss_st3; wire msrq_push_stall; wire cwbq_push_stall; wire dwbq_push_stall; wire snpq_push_stall; wire pipeline_stall; wire is_fill_st1; // determine which queue to pop next in piority order wire msrq_pop_unqual = msrq_valid_st0; wire dfpq_pop_unqual = !msrq_pop_unqual && !dfpq_empty; wire reqq_pop_unqual = !msrq_pop_unqual && !dfpq_pop_unqual && !reqq_empty && !msrq_almfull; wire snrq_pop_unqual = !msrq_pop_unqual && !dfpq_pop_unqual && !reqq_pop_unqual && !snrq_empty && !msrq_almfull; assign msrq_pop = msrq_pop_unqual && !pipeline_stall && !(is_msrq_miss_st2 || is_msrq_miss_st3); // stop if previous request was a miss assign dfpq_pop = dfpq_pop_unqual && !pipeline_stall; assign reqq_pop = reqq_pop_unqual && !pipeline_stall; assign snrq_pop = snrq_pop_unqual && !pipeline_stall; wire is_fill_st0; wire valid_st0; wire [`LINE_ADDR_WIDTH-1:0] addr_st0; wire [`UP(`WORD_SELECT_WIDTH)-1:0] wsel_st0; wire is_msrq_st0; wire [`WORD_WIDTH-1:0] writeword_st0; wire [`BANK_LINE_WIDTH-1:0] writedata_st0; wire [`REQ_INST_META_WIDTH-1:0] inst_meta_st0; wire is_snp_st0; wire snp_invalidate_st0; wire msrq_pending_hazard_unqual_st0; wire valid_st1; wire [`LINE_ADDR_WIDTH-1:0] addr_st1; wire [`UP(`WORD_SELECT_WIDTH)-1:0] wsel_st1; wire [`WORD_WIDTH-1:0] writeword_st1; wire [`REQ_INST_META_WIDTH-1:0] inst_meta_st1; wire [`BANK_LINE_WIDTH-1:0] writedata_st1; wire is_snp_st1; wire snp_invalidate_st1; wire is_msrq_st1; wire msrq_pending_hazard_st1; wire[`LINE_ADDR_WIDTH-1:0] addr_st2; assign is_msrq_st0 = msrq_pop_unqual; assign is_fill_st0 = dfpq_pop_unqual; assign valid_st0 = dfpq_pop || msrq_pop || reqq_pop || snrq_pop; assign addr_st0 = msrq_pop_unqual ? msrq_addr_st0 : dfpq_pop_unqual ? dfpq_addr_st0 : reqq_pop_unqual ? reqq_req_addr_st0[`LINE_SELECT_ADDR_RNG] : snrq_pop_unqual ? snrq_addr_st0 : 0; if (`WORD_SELECT_WIDTH != 0) begin assign wsel_st0 = reqq_pop_unqual ? reqq_req_addr_st0[`WORD_SELECT_WIDTH-1:0] : msrq_pop_unqual ? msrq_wsel_st0 : 0; end else begin `UNUSED_VAR (msrq_wsel_st0) assign wsel_st0 = 0; end assign writedata_st0 = dfpq_filldata_st0; assign inst_meta_st0 = msrq_pop_unqual ? {`REQ_TAG_WIDTH'(msrq_tag_st0) , msrq_rw_st0, msrq_byteen_st0, msrq_tid_st0} : reqq_pop_unqual ? {`REQ_TAG_WIDTH'(reqq_req_tag_st0), reqq_req_rw_st0, reqq_req_byteen_st0, reqq_req_tid_st0} : snrq_pop_unqual ? {`REQ_TAG_WIDTH'(snrq_tag_st0), 1'b0, WORD_SIZE'(0), `REQS_BITS'(0)} : 0; assign is_snp_st0 = msrq_pop_unqual ? msrq_is_snp_st0 : snrq_pop_unqual ? 1 : 0; assign snp_invalidate_st0 = msrq_pop_unqual ? msrq_snp_invalidate_st0 : snrq_pop_unqual ? snrq_invalidate_st0 : 0; assign writeword_st0 = msrq_pop_unqual ? msrq_writeword_st0 : reqq_pop_unqual ? reqq_req_writeword_st0 : 0; // we have a miss in msrq or in stage 3 for the current address wire msrq_pending_hazard_st0 = msrq_pending_hazard_unqual_st0 || ((miss_st3 || force_miss_st3) && (addr_st3 == addr_st0)); `ifdef DBG_CORE_REQ_INFO if (WORD_SIZE != `GLOBAL_BLOCK_SIZE) begin assign {debug_pc_st0, debug_rd_st0, debug_wid_st0, debug_tagid_st0, debug_rw_st0, debug_byteen_st0, debug_tid_st0} = inst_meta_st0; end `endif VX_generic_register #( .N(1 + 1 + 1 + 1 + 1 + `LINE_ADDR_WIDTH + `UP(`WORD_SELECT_WIDTH) + `WORD_WIDTH + `REQ_INST_META_WIDTH + 1 + `BANK_LINE_WIDTH) ) pipe_reg0 ( .clk (clk), .reset (reset), .stall (pipeline_stall), .flush (1'b0), .in ({is_msrq_st0, is_snp_st0, snp_invalidate_st0, msrq_pending_hazard_st0, valid_st0, addr_st0, wsel_st0, writeword_st0, inst_meta_st0, is_fill_st0, writedata_st0}), .out ({is_msrq_st1, is_snp_st1, snp_invalidate_st1, msrq_pending_hazard_st1, valid_st1, addr_st1, wsel_st1, writeword_st1, inst_meta_st1, is_fill_st1, writedata_st1}) ); `ifdef DBG_CORE_REQ_INFO if (WORD_SIZE != `GLOBAL_BLOCK_SIZE) begin assign {debug_pc_st1, debug_rd_st1, debug_wid_st1, debug_tagid_st1, debug_rw_st1, debug_byteen_st1, debug_tid_st1} = inst_meta_st1; end `endif wire[`TAG_SELECT_BITS-1:0] readtag_st1; wire writeen_st1; wire writeen_st2; wire miss_st1; wire miss_st2; wire miss_st3; wire dirty_st1; wire mem_rw_st1; wire [WORD_SIZE-1:0] mem_byteen_st1; wire force_miss_st2; `DEBUG_BEGIN wire [`REQ_TAG_WIDTH-1:0] tag_st1; wire [`REQS_BITS-1:0] tid_st1; `DEBUG_END assign {tag_st1, mem_rw_st1, mem_byteen_st1, tid_st1} = inst_meta_st1; // we have a matching previous request that missed alreedy wire st2_pending_hazard_st1 = (miss_st2 || force_miss_st2) && (addr_st2 == addr_st1); wire st3_pending_hazard_st1 = (miss_st3 || force_miss_st3) && (addr_st3 == addr_st1); // force miss to ensure commit order when a new request has pending previous requests to same block // also force a miss for msrq requests when previous requests got a miss wire force_miss_st1 = (valid_st1 && !is_msrq_st1 && !is_fill_st1 && (msrq_pending_hazard_st1 || st2_pending_hazard_st1 || st3_pending_hazard_st1)) || (valid_st1 && is_msrq_st1 && is_msrq_miss_st2); VX_tag_access #( .BANK_ID (BANK_ID), .CACHE_ID (CACHE_ID), .CORE_TAG_ID_BITS(CORE_TAG_ID_BITS), .CACHE_SIZE (CACHE_SIZE), .BANK_LINE_SIZE (BANK_LINE_SIZE), .NUM_BANKS (NUM_BANKS), .WORD_SIZE (WORD_SIZE), .DRAM_ENABLE (DRAM_ENABLE), .WRITE_ENABLE (WRITE_ENABLE) ) tag_access ( .clk (clk), .reset (reset), `ifdef DBG_CORE_REQ_INFO .debug_pc_st1 (debug_pc_st1), .debug_rd_st1 (debug_rd_st1), .debug_wid_st1 (debug_wid_st1), .debug_tagid_st1(debug_tagid_st1), `endif .stall (pipeline_stall), // Actual Read/Write .valid_req_st1 (valid_st1), .writefill_st1 (is_fill_st1), .addr_st1 (addr_st1), .mem_rw_st1 (mem_rw_st1), .is_snp_st1 (is_snp_st1), .snp_invalidate_st1(snp_invalidate_st1), .force_miss_st1 (force_miss_st1), // Read Data .readtag_st1 (readtag_st1), .miss_st1 (miss_st1), .dirty_st1 (dirty_st1), .writeen_st1 (writeen_st1) ); wire valid_st2; wire [`UP(`WORD_SELECT_WIDTH)-1:0] wsel_st2; wire [`WORD_WIDTH-1:0] writeword_st2; wire [`WORD_WIDTH-1:0] readword_st2; wire [`BANK_LINE_WIDTH-1:0] readdata_st2; wire [`BANK_LINE_WIDTH-1:0] writedata_st2; wire [WORD_SIZE-1:0] mem_byteen_st2; wire miss_st2; wire dirty_st2; wire [BANK_LINE_SIZE-1:0] dirtyb_st2; wire [`REQ_INST_META_WIDTH-1:0] inst_meta_st2; wire [`TAG_SELECT_BITS-1:0] readtag_st2; wire is_fill_st2; wire is_snp_st2; wire snp_invalidate_st2; wire force_miss_st2; wire is_msrq_st2; VX_generic_register #( .N(1 + 1 + 1 + 1 + 1 + 1 + 1 + `LINE_ADDR_WIDTH + `UP(`WORD_SELECT_WIDTH) + `WORD_WIDTH + `TAG_SELECT_BITS + 1 + 1 + `BANK_LINE_WIDTH + WORD_SIZE + `REQ_INST_META_WIDTH) ) pipe_reg1 ( .clk (clk), .reset (reset), .stall (pipeline_stall), .flush (1'b0), .in ({is_msrq_st1, writeen_st1, force_miss_st1, is_snp_st1, snp_invalidate_st1, is_fill_st1, valid_st1, addr_st1, wsel_st1, writeword_st1, readtag_st1, miss_st1, dirty_st1, writedata_st1, mem_byteen_st1, inst_meta_st1}), .out ({is_msrq_st2, writeen_st2, force_miss_st2, is_snp_st2, snp_invalidate_st2, is_fill_st2, valid_st2, addr_st2, wsel_st2, writeword_st2, readtag_st2, miss_st2, dirty_st2, writedata_st2, mem_byteen_st2, inst_meta_st2}) ); `ifdef DBG_CORE_REQ_INFO if (WORD_SIZE != `GLOBAL_BLOCK_SIZE) begin assign {debug_pc_st2, debug_rd_st2, debug_wid_st2, debug_tagid_st2, debug_rw_st2, debug_byteen_st2, debug_tid_st2} = inst_meta_st2; end `endif assign is_msrq_miss_st2 = (miss_st2 || force_miss_st2) && is_msrq_st2; VX_data_access #( .BANK_ID (BANK_ID), .CACHE_ID (CACHE_ID), .CORE_TAG_ID_BITS(CORE_TAG_ID_BITS), .CACHE_SIZE (CACHE_SIZE), .BANK_LINE_SIZE (BANK_LINE_SIZE), .NUM_BANKS (NUM_BANKS), .WORD_SIZE (WORD_SIZE), .DRAM_ENABLE (DRAM_ENABLE), .WRITE_ENABLE (WRITE_ENABLE) ) data_access ( .clk (clk), .reset (reset), `ifdef DBG_CORE_REQ_INFO .debug_pc_st2 (debug_pc_st2), .debug_rd_st2 (debug_rd_st2), .debug_wid_st2 (debug_wid_st2), .debug_tagid_st2(debug_tagid_st2), `endif .stall (pipeline_stall), // Actual Read/Write .valid_req_st2 (valid_st2), .writeen_st2 (writeen_st2), .writefill_st2 (is_fill_st2), .addr_st2 (addr_st2), .wordsel_st2 (wsel_st2), .mem_byteen_st2 (mem_byteen_st2), .writeword_st2 (writeword_st2), .writedata_st2 (writedata_st2), // Read Data .readword_st2 (readword_st2), .readdata_st2 (readdata_st2), .dirtyb_st2 (dirtyb_st2) ); wire valid_st3; wire [`LINE_ADDR_WIDTH-1:0] addr_st3; wire [`UP(`WORD_SELECT_WIDTH)-1:0] wsel_st3; wire [`WORD_WIDTH-1:0] writeword_st3; wire [`WORD_WIDTH-1:0] readword_st3; wire [`BANK_LINE_WIDTH-1:0] readdata_st3; wire miss_st3; wire dirty_st3; wire [BANK_LINE_SIZE-1:0] dirtyb_st3; wire [`REQ_INST_META_WIDTH-1:0] inst_meta_st3; wire [`TAG_SELECT_BITS-1:0] readtag_st3; wire is_fill_st3; wire is_snp_st3; wire snp_invalidate_st3; wire force_miss_st3; wire is_msrq_st3; VX_generic_register #( .N(1+ 1+ 1 + 1 + 1 + 1 + `LINE_ADDR_WIDTH + `UP(`WORD_SELECT_WIDTH) + `WORD_WIDTH + `WORD_WIDTH + `BANK_LINE_WIDTH + `TAG_SELECT_BITS + 1 + 1 + BANK_LINE_SIZE + `REQ_INST_META_WIDTH) ) pipe_reg2 ( .clk (clk), .reset (reset), .stall (pipeline_stall), .flush (1'b0), .in ({is_msrq_st2, force_miss_st2, is_snp_st2, snp_invalidate_st2, is_fill_st2, valid_st2, addr_st2, wsel_st2, writeword_st2, readword_st2, readdata_st2, readtag_st2, miss_st2, dirty_st2, dirtyb_st2, inst_meta_st2}), .out ({is_msrq_st3, force_miss_st3, is_snp_st3, snp_invalidate_st3, is_fill_st3, valid_st3, addr_st3, wsel_st3, writeword_st3, readword_st3, readdata_st3, readtag_st3, miss_st3, dirty_st3, dirtyb_st3, inst_meta_st3}) ); `ifdef DBG_CORE_REQ_INFO if (WORD_SIZE != `GLOBAL_BLOCK_SIZE) begin assign {debug_pc_st3, debug_rd_st3, debug_wid_st3, debug_tagid_st3, debug_rw_st3, debug_byteen_st3, debug_tid_st3} = inst_meta_st3; end `endif assign is_msrq_miss_st3 = (miss_st3 || force_miss_st3) && is_msrq_st3; // Enqueue to miss reserv if it's a valid miss wire[`REQS_BITS-1:0] miss_add_tid; wire[`REQ_TAG_WIDTH-1:0] miss_add_tag; wire miss_add_rw; wire[WORD_SIZE-1:0] miss_add_byteen; wire miss_add_unqual = miss_st3 || force_miss_st3; assign msrq_push_stall = (miss_st3 || force_miss_st3) && msrq_full; wire miss_add = miss_add_unqual && !msrq_full && !cwbq_push_stall && !dwbq_push_stall && !snpq_push_stall; assign {miss_add_tag, miss_add_rw, miss_add_byteen, miss_add_tid} = inst_meta_st3; // a matching fill request is comming wire incoming_st0_fill_st3 = 0 /*is_fill_st0 && (addr_st3 == dfpq_addr_st0)*/; // clock delay issue wire incoming_st1_fill_st3 = is_fill_st1 && (addr_st3 == addr_st1); wire incoming_st2_fill_st3 = is_fill_st2 && (addr_st3 == addr_st2); wire incoming_fill = incoming_st2_fill_st3 || incoming_st1_fill_st3 || incoming_st0_fill_st3; if (DRAM_ENABLE) begin wire msrq_dequeue_st3 = valid_st3 && is_msrq_st3 && !miss_add_unqual && !pipeline_stall; // mark msrq entry that match DRAM fill as 'ready' wire update_ready_st0 = dfpq_pop; // push missed requests as 'ready' // if it didn't actually missed but had to abort because of pending requets in msrq // or if a matching fill request is coming wire msrq_init_ready_state_st3 = !miss_st3 || incoming_fill; VX_cache_miss_resrv #( .BANK_ID (BANK_ID), .CACHE_ID (CACHE_ID), .CORE_TAG_ID_BITS (CORE_TAG_ID_BITS), .BANK_LINE_SIZE (BANK_LINE_SIZE), .NUM_BANKS (NUM_BANKS), .WORD_SIZE (WORD_SIZE), .NUM_REQUESTS (NUM_REQUESTS), .MRVQ_SIZE (MRVQ_SIZE), .CORE_TAG_WIDTH (CORE_TAG_WIDTH), .SNP_REQ_TAG_WIDTH (SNP_REQ_TAG_WIDTH) ) cache_miss_resrv ( .clk (clk), .reset (reset), `ifdef DBG_CORE_REQ_INFO .debug_pc_st0 (debug_pc_st0), .debug_rd_st0 (debug_rd_st0), .debug_wid_st0 (debug_wid_st0), .debug_tagid_st0(debug_tagid_st0), .debug_pc_st3 (debug_pc_st3), .debug_rd_st3 (debug_rd_st3), .debug_wid_st3 (debug_wid_st3), .debug_tagid_st3(debug_tagid_st3), `endif // enqueue .enqueue_st3 (miss_add), .enqueue_addr_st3 (addr_st3), .enqueue_wsel_st3 (wsel_st3), .enqueue_data_st3 (writeword_st3), .enqueue_tid_st3 (miss_add_tid), .enqueue_tag_st3 (miss_add_tag), .enqueue_rw_st3 (miss_add_rw), .enqueue_byteen_st3 (miss_add_byteen), .enqueue_is_snp_st3 (is_snp_st3), .enqueue_snp_inv_st3 (snp_invalidate_st3), .enqueue_msrq_st3 (is_msrq_st3), .enqueue_ready_st3 (msrq_init_ready_state_st3), .enqueue_full (msrq_full), .enqueue_almfull (msrq_almfull), // fill .update_ready_st0 (update_ready_st0), .addr_st0 (addr_st0), .pending_hazard_st0 (msrq_pending_hazard_unqual_st0), // dequeue .schedule_st0 (msrq_pop), .dequeue_valid_st0 (msrq_valid_st0), .dequeue_addr_st0 (msrq_addr_st0), .dequeue_wsel_st0 (msrq_wsel_st0), .dequeue_data_st0 (msrq_writeword_st0), .dequeue_tid_st0 (msrq_tid_st0), .dequeue_tag_st0 (msrq_tag_st0), .dequeue_rw_st0 (msrq_rw_st0), .dequeue_byteen_st0 (msrq_byteen_st0), .dequeue_is_snp_st0 (msrq_is_snp_st0), .dequeue_snp_inv_st0 (msrq_snp_invalidate_st0), .dequeue_st3 (msrq_dequeue_st3) ); end else begin `UNUSED_VAR (miss_add) `UNUSED_VAR (wsel_st3) `UNUSED_VAR (writeword_st3) `UNUSED_VAR (snp_invalidate_st3) `UNUSED_VAR (miss_add_byteen) assign msrq_pending_hazard_unqual_st0 = 0; assign msrq_full = 0; assign msrq_almfull = 0; assign msrq_valid_st0 = 0; assign msrq_addr_st0 = 0; assign msrq_wsel_st0 = 0; assign msrq_writeword_st0 = 0; assign msrq_tid_st0 = 0; assign msrq_tag_st0 = 0; assign msrq_rw_st0 = 0; assign msrq_byteen_st0 = 0; assign msrq_is_snp_st0 = 0; assign msrq_snp_invalidate_st0 = 0; end // Enqueue core response wire cwbq_empty, cwbq_full; wire cwbq_push_unqual = valid_st3 && !is_fill_st3 && !is_snp_st3 && !miss_st3 && !force_miss_st3 && !miss_add_rw; assign cwbq_push_stall = cwbq_push_unqual && cwbq_full; wire cwbq_push = cwbq_push_unqual && !cwbq_full && !msrq_push_stall && !dwbq_push_stall && !snpq_push_stall; wire cwbq_pop = core_rsp_valid && core_rsp_ready; wire [`REQS_BITS-1:0] cwbq_tid = miss_add_tid; wire [CORE_TAG_WIDTH-1:0] cwbq_tag = CORE_TAG_WIDTH'(miss_add_tag); wire [`WORD_WIDTH-1:0] cwbq_data = readword_st3; VX_generic_queue #( .DATAW(`REQS_BITS + CORE_TAG_WIDTH + `WORD_WIDTH), .SIZE(CWBQ_SIZE) ) cwb_queue ( .clk (clk), .reset (reset), .push (cwbq_push), .pop (cwbq_pop), .data_in ({cwbq_tid, cwbq_tag, cwbq_data}), .data_out({core_rsp_tid, core_rsp_tag, core_rsp_data}), .empty (cwbq_empty), .full (cwbq_full), `UNUSED_PIN (size) ); assign core_rsp_valid = !cwbq_empty; // Enqueue DRAM request wire dwbq_empty, dwbq_full; wire dwbq_is_dfl_in = valid_st3 && miss_st3 && !incoming_fill && (!force_miss_st3 || is_msrq_st3); wire dwbq_is_dwb_in = valid_st3 && dirty_st3 && !force_miss_st3 && (is_fill_st3 || is_snp_st3); wire dwbq_push_unqual = dwbq_is_dfl_in || dwbq_is_dwb_in; assign dwbq_push_stall = dwbq_push_unqual && dwbq_full; wire dwbq_push = dwbq_push_unqual && !dwbq_full && !msrq_push_stall && !cwbq_push_stall && !snpq_push_stall; wire dwbq_pop = dram_req_valid && dram_req_ready; if (DRAM_ENABLE) begin wire [`LINE_ADDR_WIDTH-1:0] dwbq_req_addr = dwbq_is_dwb_in ? {readtag_st3, addr_st3[`LINE_SELECT_BITS-1:0]} : addr_st3; VX_generic_queue #( .DATAW(1 + BANK_LINE_SIZE + `LINE_ADDR_WIDTH + `BANK_LINE_WIDTH), .SIZE(DREQ_SIZE) ) dwb_queue ( .clk (clk), .reset (reset), .push (dwbq_push), .pop (dwbq_pop), .data_in ({dwbq_is_dwb_in, dirtyb_st3, dwbq_req_addr, readdata_st3}), .data_out({dram_req_rw, dram_req_byteen, dram_req_addr, dram_req_data}), .empty (dwbq_empty), .full (dwbq_full), `UNUSED_PIN (size) ); end else begin `UNUSED_VAR (dwbq_push) `UNUSED_VAR (dwbq_pop) `UNUSED_VAR (readtag_st3) `UNUSED_VAR (dirtyb_st3) `UNUSED_VAR (readdata_st3) assign dwbq_empty = 1; assign dwbq_full = 0; assign dram_req_rw = 0; assign dram_req_byteen = 0; assign dram_req_addr = 0; assign dram_req_data = 0; `UNUSED_VAR (dram_req_ready) end assign dram_req_valid = !dwbq_empty; // Enqueue snoop response wire snpq_empty, snpq_full; wire snpq_push_unqual = valid_st3 && is_snp_st3 && !force_miss_st3; assign snpq_push_stall = snpq_push_unqual && snpq_full; wire snpq_push = snpq_push_unqual && !snpq_full && !msrq_push_stall && !cwbq_push_stall && !dwbq_push_stall; wire snpq_pop = snp_rsp_valid && snp_rsp_ready; wire [SNP_REQ_TAG_WIDTH-1:0] snpq_tag_st3 = SNP_REQ_TAG_WIDTH'(miss_add_tag); if (FLUSH_ENABLE) begin VX_generic_queue #( .DATAW(SNP_REQ_TAG_WIDTH), .SIZE(SNPQ_SIZE) ) snp_queue ( .clk (clk), .reset (reset), .push (snpq_push), .pop (snpq_pop), .data_in (snpq_tag_st3), .data_out(snp_rsp_tag), .empty (snpq_empty), .full (snpq_full), `UNUSED_PIN (size) ); end else begin `UNUSED_VAR (snpq_push) `UNUSED_VAR (snpq_pop) `UNUSED_VAR (snpq_tag_st3) assign snpq_empty = 1; assign snpq_full = 0; assign snp_rsp_tag = 0; `UNUSED_VAR (snp_rsp_ready) end assign snp_rsp_valid = !snpq_empty && dwbq_empty; // ensure all writebacks are sent // bank pipeline stall assign pipeline_stall = msrq_push_stall || cwbq_push_stall || dwbq_push_stall || snpq_push_stall; `SCOPE_ASSIGN (valid_st0, valid_st0); `SCOPE_ASSIGN (valid_st, valid_st1); `SCOPE_ASSIGN (valid_st2, valid_st2); `SCOPE_ASSIGN (valid_st3, valid_st3); `SCOPE_ASSIGN (is_msrq_st1, is_msrq_st1); `SCOPE_ASSIGN (miss_st1, miss_st1); `SCOPE_ASSIGN (dirty_st1, dirty_st1); `SCOPE_ASSIGN (force_miss_st1, force_miss_st1); `SCOPE_ASSIGN (stall_pipe, pipeline_stall); `SCOPE_ASSIGN (addr_st0, `LINE_TO_BYTE_ADDR(addr_st0, BANK_ID)); `SCOPE_ASSIGN (addr_st1, `LINE_TO_BYTE_ADDR(addr_st1, BANK_ID)); `SCOPE_ASSIGN (addr_st2, `LINE_TO_BYTE_ADDR(addr_st2, BANK_ID)); `SCOPE_ASSIGN (addr_st3, `LINE_TO_BYTE_ADDR(addr_st3, BANK_ID)); `ifdef DBG_PRINT_CACHE_BANK always @(posedge clk) begin if (miss_st3 && (incoming_st0_fill_st3 || incoming_st2_fill_st3)) begin $display("%t: incoming fill - addr=%0h, st0=%b, st1=%b", $time, `LINE_TO_BYTE_ADDR(addr_st3, BANK_ID), incoming_st0_fill_st3, incoming_st2_fill_st3); assert(!is_msrq_st3); end if ((|core_req_valid) && core_req_ready) begin $display("%t: cache%0d:%0d core-req: addr=%0h, tag=%0h", $time, CACHE_ID, BANK_ID, `LINE_TO_BYTE_ADDR(core_req_addr[0], BANK_ID), core_req_tag); end if (core_rsp_valid && core_rsp_ready) begin $display("%t: cache%0d:%0d core-rsp: tag=%0h, data=%0h", $time, CACHE_ID, BANK_ID, core_rsp_tag, core_rsp_data); end if (dram_req_valid && dram_req_ready) begin $display("%t: cache%0d:%0d dram-req: addr=%0h, data=%0h", $time, CACHE_ID, BANK_ID, `LINE_TO_BYTE_ADDR(dram_req_addr, BANK_ID), dram_req_data); end if (dram_rsp_valid && dram_rsp_ready) begin $display("%t: cache%0d:%0d dram-rsp: addr=%0h, data=%0h", $time, CACHE_ID, BANK_ID, `LINE_TO_BYTE_ADDR(dram_rsp_addr, BANK_ID), dram_rsp_data); end if (snp_req_valid && snp_req_ready) begin $display("%t: cache%0d:%0d snp-req: addr=%0h, tag=%0h, invalidate=%0d", $time, CACHE_ID, BANK_ID, `LINE_TO_BYTE_ADDR(snp_req_addr, BANK_ID), snp_req_tag, snp_req_invalidate); end if (snp_rsp_valid && snp_rsp_ready) begin $display("%t: cache%0d:%0d snp-rsp: tag=%0h", $time, CACHE_ID, BANK_ID, snp_rsp_tag); end if (msrq_pop) begin $display("%t: cache%0d:%0d msrq-pop: addr=%0h wid=%0d, PC=%0h", $time, CACHE_ID, BANK_ID, `LINE_TO_BYTE_ADDR(addr_st0, BANK_ID), debug_wid_st0, debug_pc_st0); end if (dfpq_pop) begin $display("%t: cache%0d:%0d dfpq-pop: addr=%0h", $time, CACHE_ID, BANK_ID, `LINE_TO_BYTE_ADDR(addr_st0, BANK_ID)); end if (reqq_pop) begin $display("%t: cache%0d:%0d reqq-pop: addr=%0h wid=%0d, PC=%0h", $time, CACHE_ID, BANK_ID, `LINE_TO_BYTE_ADDR(addr_st0, BANK_ID), debug_wid_st0, debug_pc_st0); end if (snrq_pop) begin $display("%t: cache%0d:%0d snrq-pop: addr=%0h tag=%0d", $time, CACHE_ID, BANK_ID, `LINE_TO_BYTE_ADDR(addr_st0, BANK_ID), snrq_tag_st0); end if (cwbq_push) begin $display("%t: cache%0d:%0d cwbq-push: addr=%0h wid=%0d, PC=%0h", $time, CACHE_ID, BANK_ID, `LINE_TO_BYTE_ADDR(addr_st3, BANK_ID), debug_wid_st3, debug_pc_st3); end if (dwbq_push) begin $display("%t: cache%0d:%0d dwbq-push: addr=%0h wid=%0d, PC=%0h, rw=%b", $time, CACHE_ID, BANK_ID, `LINE_TO_BYTE_ADDR(addr_st3, BANK_ID), debug_wid_st3, debug_pc_st3, dwbq_is_dwb_in); end if (snpq_push) begin $display("%t: cache%0d:%0d snpq-push: addr=%0h tag=%0d", $time, CACHE_ID, BANK_ID, `LINE_TO_BYTE_ADDR(addr_st3, BANK_ID), snpq_tag_st3); end end `endif endmodule