performance refactoring - rebalanced stream buffers across the device to enforce the output buffering rule at component boundaries, finally resolved block RAM R/W collision discrepancies.
This commit is contained in:
@@ -26,9 +26,7 @@ module VX_dp_ram #(
|
||||
localparam DATA32W = DATAW / 32;
|
||||
localparam BYTEEN32W = BYTEENW / 4;
|
||||
|
||||
//`ifndef QUARTUS
|
||||
|
||||
if (FASTRAM) begin
|
||||
if (FASTRAM) begin
|
||||
if (BUFFERED) begin
|
||||
reg [DATAW-1:0] dout_r;
|
||||
|
||||
@@ -57,72 +55,36 @@ module VX_dp_ram #(
|
||||
dout_r <= mem[raddr];
|
||||
end
|
||||
end
|
||||
|
||||
assign dout = dout_r;
|
||||
|
||||
end else begin
|
||||
|
||||
`UNUSED_VAR (rden)
|
||||
|
||||
if (RWCHECK) begin
|
||||
if (BYTEENW > 1) begin
|
||||
`USE_FAST_BRAM reg [DATA32W-1:0][3:0][7:0] mem [SIZE-1:0];
|
||||
|
||||
if (BYTEENW > 1) begin
|
||||
`USE_FAST_BRAM reg [DATA32W-1:0][3:0][7:0] mem [SIZE-1:0];
|
||||
|
||||
always @(posedge clk) begin
|
||||
if (wren) begin
|
||||
for (integer j = 0; j < BYTEEN32W; j++) begin
|
||||
for (integer i = 0; i < 4; i++) begin
|
||||
if (byteen[j * 4 + i])
|
||||
mem[waddr][j][i] <= din[j * 32 + i * 8 +: 8];
|
||||
end
|
||||
always @(posedge clk) begin
|
||||
if (wren) begin
|
||||
for (integer j = 0; j < BYTEEN32W; j++) begin
|
||||
for (integer i = 0; i < 4; i++) begin
|
||||
if (byteen[j * 4 + i])
|
||||
mem[waddr][j][i] <= din[j * 32 + i * 8 +: 8];
|
||||
end
|
||||
end
|
||||
end
|
||||
assign dout = mem[raddr];
|
||||
|
||||
end else begin
|
||||
`USE_FAST_BRAM reg [DATAW-1:0] mem [SIZE-1:0];
|
||||
|
||||
always @(posedge clk) begin
|
||||
if (wren && byteen)
|
||||
mem[waddr] <= din;
|
||||
end
|
||||
assign dout = mem[raddr];
|
||||
end
|
||||
|
||||
assign dout = mem[raddr];
|
||||
end else begin
|
||||
`USE_FAST_BRAM reg [DATAW-1:0] mem [SIZE-1:0];
|
||||
|
||||
if (BYTEENW > 1) begin
|
||||
`USE_FAST_BRAM `NO_RW_RAM_CHECK reg [DATA32W-1:0][3:0][7:0] mem [SIZE-1:0];
|
||||
|
||||
always @(posedge clk) begin
|
||||
if (wren) begin
|
||||
for (integer j = 0; j < BYTEEN32W; j++) begin
|
||||
for (integer i = 0; i < 4; i++) begin
|
||||
if (byteen[j * 4 + i])
|
||||
mem[waddr][j][i] <= din[j * 32 + i * 8 +: 8];
|
||||
end
|
||||
end
|
||||
end
|
||||
end
|
||||
assign dout = mem[raddr];
|
||||
end else begin
|
||||
`USE_FAST_BRAM `NO_RW_RAM_CHECK reg [DATAW-1:0] mem [SIZE-1:0];
|
||||
|
||||
always @(posedge clk) begin
|
||||
if (wren && byteen)
|
||||
mem[waddr] <= din;
|
||||
end
|
||||
assign dout = mem[raddr];
|
||||
end
|
||||
end
|
||||
always @(posedge clk) begin
|
||||
if (wren && byteen)
|
||||
mem[waddr] <= din;
|
||||
end
|
||||
assign dout = mem[raddr];
|
||||
end
|
||||
end
|
||||
|
||||
end else begin
|
||||
|
||||
if (BUFFERED) begin
|
||||
|
||||
reg [DATAW-1:0] dout_r;
|
||||
|
||||
if (BYTEENW > 1) begin
|
||||
@@ -150,14 +112,11 @@ module VX_dp_ram #(
|
||||
dout_r <= mem[raddr];
|
||||
end
|
||||
end
|
||||
|
||||
assign dout = dout_r;
|
||||
end else begin
|
||||
|
||||
`UNUSED_VAR (rden)
|
||||
|
||||
if (RWCHECK) begin
|
||||
|
||||
if (BYTEENW > 1) begin
|
||||
reg [DATA32W-1:0][3:0][7:0] mem [SIZE-1:0];
|
||||
|
||||
@@ -208,96 +167,6 @@ module VX_dp_ram #(
|
||||
end
|
||||
end
|
||||
end
|
||||
|
||||
/*`else
|
||||
|
||||
localparam OUTDATA_REG_B = BUFFERED ? "CLOCK0" : "UNREGISTERED";
|
||||
localparam RAM_BLOCK_TYPE = FASTRAM ? "MLAB" : "AUTO";
|
||||
|
||||
if (RWCHECK) begin
|
||||
|
||||
altsyncram #(
|
||||
.init_file (),
|
||||
.operation_mode ("DUAL_PORT"),
|
||||
.numwords_a (SIZE),
|
||||
.numwords_b (SIZE),
|
||||
.widthad_a (ADDRW),
|
||||
.widthad_b (ADDRW),
|
||||
.width_a (DATAW),
|
||||
.width_b (DATAW),
|
||||
.width_byteena_a(BYTEENW),
|
||||
.address_reg_b ("CLOCK0"),
|
||||
.outdata_reg_b (OUTDATA_REG_B),
|
||||
.ram_block_type (RAM_BLOCK_TYPE)
|
||||
) mem (
|
||||
.clocken0 (1'b1),
|
||||
.clocken1 (),
|
||||
.clocken2 (),
|
||||
.clocken3 (),
|
||||
.clock0 (clk),
|
||||
.clock1 (),
|
||||
.address_a (waddr),
|
||||
.address_b (raddr),
|
||||
.byteena_a (byteen),
|
||||
.byteena_b (1'b1),
|
||||
.wren_a (wren),
|
||||
.wren_b (1'b0),
|
||||
.data_a (din),
|
||||
.data_b (),
|
||||
.rden_a (),
|
||||
.rden_b (1'b1),
|
||||
.q_a (),
|
||||
.q_b (dout),
|
||||
.addressstall_a (1'b0),
|
||||
.addressstall_b (1'b0),
|
||||
.aclr0 (1'b0),
|
||||
.aclr1 (1'b0),
|
||||
.eccstatus ()
|
||||
);
|
||||
|
||||
end else begin
|
||||
|
||||
`NO_RW_RAM_CHECK altsyncram #(
|
||||
.init_file (),
|
||||
.operation_mode ("DUAL_PORT"),
|
||||
.numwords_a (SIZE),
|
||||
.numwords_b (SIZE),
|
||||
.widthad_a (ADDRW),
|
||||
.widthad_b (ADDRW),
|
||||
.width_a (DATAW),
|
||||
.width_b (DATAW),
|
||||
.width_byteena_a(BYTEENW),
|
||||
.outdata_reg_b (OUTDATA_REG_B),
|
||||
.ram_block_type (RAM_BLOCK_TYPE)
|
||||
) mem (
|
||||
.clocken0 (1'b1),
|
||||
.clocken1 (1'b1),
|
||||
.clocken2 (1'b1),
|
||||
.clocken3 (1'b1),
|
||||
.clock0 (clk),
|
||||
.clock1 (clk),
|
||||
.address_a (waddr),
|
||||
.address_b (raddr),
|
||||
.byteena_a (byteen),
|
||||
.byteena_b (1'b1),
|
||||
.wren_a (wren),
|
||||
.wren_b (1'b0),
|
||||
.data_a (din),
|
||||
.data_b (),
|
||||
.rden_a (),
|
||||
.rden_b (1'b1),
|
||||
.q_a (),
|
||||
.q_b (dout),
|
||||
.addressstall_a (1'b0),
|
||||
.addressstall_b (1'b0),
|
||||
.aclr0 (1'b0),
|
||||
.aclr1 (1'b0),
|
||||
.eccstatus ()
|
||||
);
|
||||
|
||||
end
|
||||
|
||||
`endif*/
|
||||
|
||||
|
||||
endmodule
|
||||
`TRACING_ON
|
||||
Reference in New Issue
Block a user