mirror of
https://github.com/corundum/corundum.git
synced 2025-01-16 08:12:53 +08:00
8797aa481f
Signed-off-by: Alex Forencich <alex@alexforencich.com>
1855 lines
80 KiB
Verilog
1855 lines
80 KiB
Verilog
/*
|
|
|
|
Copyright (c) 2019-2021 Alex Forencich
|
|
|
|
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
of this software and associated documentation files (the "Software"), to deal
|
|
in the Software without restriction, including without limitation the rights
|
|
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
copies of the Software, and to permit persons to whom the Software is
|
|
furnished to do so, subject to the following conditions:
|
|
|
|
The above copyright notice and this permission notice shall be included in
|
|
all copies or substantial portions of the Software.
|
|
|
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY
|
|
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
THE SOFTWARE.
|
|
|
|
*/
|
|
|
|
// Language: Verilog 2001
|
|
|
|
`resetall
|
|
`timescale 1ns / 1ps
|
|
`default_nettype none
|
|
|
|
/*
|
|
* Ultrascale PCIe DMA read interface
|
|
*/
|
|
module dma_if_pcie_us_rd #
|
|
(
|
|
// Width of PCIe AXI stream interfaces in bits
|
|
parameter AXIS_PCIE_DATA_WIDTH = 256,
|
|
// PCIe AXI stream tkeep signal width (words per cycle)
|
|
parameter AXIS_PCIE_KEEP_WIDTH = (AXIS_PCIE_DATA_WIDTH/32),
|
|
// PCIe AXI stream RC tuser signal width
|
|
parameter AXIS_PCIE_RC_USER_WIDTH = AXIS_PCIE_DATA_WIDTH < 512 ? 75 : 161,
|
|
// PCIe AXI stream RQ tuser signal width
|
|
parameter AXIS_PCIE_RQ_USER_WIDTH = AXIS_PCIE_DATA_WIDTH < 512 ? 60 : 137,
|
|
// RQ sequence number width
|
|
parameter RQ_SEQ_NUM_WIDTH = AXIS_PCIE_RQ_USER_WIDTH == 60 ? 4 : 6,
|
|
// RQ sequence number tracking enable
|
|
parameter RQ_SEQ_NUM_ENABLE = 0,
|
|
// RAM select width
|
|
parameter RAM_SEL_WIDTH = 2,
|
|
// RAM address width
|
|
parameter RAM_ADDR_WIDTH = 16,
|
|
// RAM segment count
|
|
parameter SEG_COUNT = AXIS_PCIE_DATA_WIDTH > 64 ? AXIS_PCIE_DATA_WIDTH*2 / 128 : 2,
|
|
// RAM segment data width
|
|
parameter SEG_DATA_WIDTH = AXIS_PCIE_DATA_WIDTH*2/SEG_COUNT,
|
|
// RAM segment byte enable width
|
|
parameter SEG_BE_WIDTH = SEG_DATA_WIDTH/8,
|
|
// RAM segment address width
|
|
parameter SEG_ADDR_WIDTH = RAM_ADDR_WIDTH-$clog2(SEG_COUNT*SEG_BE_WIDTH),
|
|
// PCIe address width
|
|
parameter PCIE_ADDR_WIDTH = 64,
|
|
// PCIe tag count
|
|
parameter PCIE_TAG_COUNT = AXIS_PCIE_RQ_USER_WIDTH == 60 ? 64 : 256,
|
|
// Length field width
|
|
parameter LEN_WIDTH = 16,
|
|
// Tag field width
|
|
parameter TAG_WIDTH = 8,
|
|
// Operation table size
|
|
parameter OP_TABLE_SIZE = PCIE_TAG_COUNT,
|
|
// In-flight transmit limit
|
|
parameter TX_LIMIT = 2**(RQ_SEQ_NUM_WIDTH-1),
|
|
// Transmit flow control
|
|
parameter TX_FC_ENABLE = 0
|
|
)
|
|
(
|
|
input wire clk,
|
|
input wire rst,
|
|
|
|
/*
|
|
* AXI input (RC)
|
|
*/
|
|
input wire [AXIS_PCIE_DATA_WIDTH-1:0] s_axis_rc_tdata,
|
|
input wire [AXIS_PCIE_KEEP_WIDTH-1:0] s_axis_rc_tkeep,
|
|
input wire s_axis_rc_tvalid,
|
|
output wire s_axis_rc_tready,
|
|
input wire s_axis_rc_tlast,
|
|
input wire [AXIS_PCIE_RC_USER_WIDTH-1:0] s_axis_rc_tuser,
|
|
|
|
/*
|
|
* AXI output (RQ)
|
|
*/
|
|
output wire [AXIS_PCIE_DATA_WIDTH-1:0] m_axis_rq_tdata,
|
|
output wire [AXIS_PCIE_KEEP_WIDTH-1:0] m_axis_rq_tkeep,
|
|
output wire m_axis_rq_tvalid,
|
|
input wire m_axis_rq_tready,
|
|
output wire m_axis_rq_tlast,
|
|
output wire [AXIS_PCIE_RQ_USER_WIDTH-1:0] m_axis_rq_tuser,
|
|
|
|
/*
|
|
* Transmit sequence number input
|
|
*/
|
|
input wire [RQ_SEQ_NUM_WIDTH-1:0] s_axis_rq_seq_num_0,
|
|
input wire s_axis_rq_seq_num_valid_0,
|
|
input wire [RQ_SEQ_NUM_WIDTH-1:0] s_axis_rq_seq_num_1,
|
|
input wire s_axis_rq_seq_num_valid_1,
|
|
|
|
/*
|
|
* Transmit flow control
|
|
*/
|
|
input wire [7:0] pcie_tx_fc_nph_av,
|
|
|
|
/*
|
|
* AXI read descriptor input
|
|
*/
|
|
input wire [PCIE_ADDR_WIDTH-1:0] s_axis_read_desc_pcie_addr,
|
|
input wire [RAM_SEL_WIDTH-1:0] s_axis_read_desc_ram_sel,
|
|
input wire [RAM_ADDR_WIDTH-1:0] s_axis_read_desc_ram_addr,
|
|
input wire [LEN_WIDTH-1:0] s_axis_read_desc_len,
|
|
input wire [TAG_WIDTH-1:0] s_axis_read_desc_tag,
|
|
input wire s_axis_read_desc_valid,
|
|
output wire s_axis_read_desc_ready,
|
|
|
|
/*
|
|
* AXI read descriptor status output
|
|
*/
|
|
output wire [TAG_WIDTH-1:0] m_axis_read_desc_status_tag,
|
|
output wire [3:0] m_axis_read_desc_status_error,
|
|
output wire m_axis_read_desc_status_valid,
|
|
|
|
/*
|
|
* RAM interface
|
|
*/
|
|
output wire [SEG_COUNT*RAM_SEL_WIDTH-1:0] ram_wr_cmd_sel,
|
|
output wire [SEG_COUNT*SEG_BE_WIDTH-1:0] ram_wr_cmd_be,
|
|
output wire [SEG_COUNT*SEG_ADDR_WIDTH-1:0] ram_wr_cmd_addr,
|
|
output wire [SEG_COUNT*SEG_DATA_WIDTH-1:0] ram_wr_cmd_data,
|
|
output wire [SEG_COUNT-1:0] ram_wr_cmd_valid,
|
|
input wire [SEG_COUNT-1:0] ram_wr_cmd_ready,
|
|
input wire [SEG_COUNT-1:0] ram_wr_done,
|
|
|
|
/*
|
|
* Configuration
|
|
*/
|
|
input wire enable,
|
|
input wire ext_tag_enable,
|
|
input wire [15:0] requester_id,
|
|
input wire requester_id_enable,
|
|
input wire [2:0] max_read_request_size,
|
|
|
|
/*
|
|
* Status
|
|
*/
|
|
output wire status_error_cor,
|
|
output wire status_error_uncor
|
|
);
|
|
|
|
parameter RAM_WORD_WIDTH = SEG_BE_WIDTH;
|
|
parameter RAM_WORD_SIZE = SEG_DATA_WIDTH/RAM_WORD_WIDTH;
|
|
|
|
parameter AXIS_PCIE_WORD_WIDTH = AXIS_PCIE_KEEP_WIDTH;
|
|
parameter AXIS_PCIE_WORD_SIZE = AXIS_PCIE_DATA_WIDTH/AXIS_PCIE_WORD_WIDTH;
|
|
|
|
parameter OFFSET_WIDTH = $clog2(AXIS_PCIE_DATA_WIDTH/8);
|
|
parameter RAM_OFFSET_WIDTH = $clog2(SEG_COUNT*SEG_DATA_WIDTH/8);
|
|
|
|
parameter PCIE_TAG_WIDTH = $clog2(PCIE_TAG_COUNT);
|
|
parameter PCIE_TAG_COUNT_1 = 2**PCIE_TAG_WIDTH > 32 ? 32 : 2**PCIE_TAG_WIDTH;
|
|
parameter PCIE_TAG_WIDTH_1 = $clog2(PCIE_TAG_COUNT_1);
|
|
parameter PCIE_TAG_COUNT_2 = 2**PCIE_TAG_WIDTH > 32 ? 2**PCIE_TAG_WIDTH-32 : 0;
|
|
parameter PCIE_TAG_WIDTH_2 = $clog2(PCIE_TAG_COUNT_2);
|
|
|
|
parameter OP_TAG_WIDTH = $clog2(OP_TABLE_SIZE);
|
|
parameter OP_TABLE_READ_COUNT_WIDTH = PCIE_TAG_WIDTH+1;
|
|
|
|
parameter STATUS_FIFO_ADDR_WIDTH = 5;
|
|
parameter OUTPUT_FIFO_ADDR_WIDTH = 5;
|
|
|
|
parameter INIT_COUNT_WIDTH = PCIE_TAG_WIDTH > OP_TAG_WIDTH ? PCIE_TAG_WIDTH : OP_TAG_WIDTH;
|
|
|
|
// bus width assertions
|
|
initial begin
|
|
if (AXIS_PCIE_DATA_WIDTH != 64 && AXIS_PCIE_DATA_WIDTH != 128 && AXIS_PCIE_DATA_WIDTH != 256 && AXIS_PCIE_DATA_WIDTH != 512) begin
|
|
$error("Error: PCIe interface width must be 64, 128, or 256 (instance %m)");
|
|
$finish;
|
|
end
|
|
|
|
if (AXIS_PCIE_KEEP_WIDTH * 32 != AXIS_PCIE_DATA_WIDTH) begin
|
|
$error("Error: PCIe interface requires dword (32-bit) granularity (instance %m)");
|
|
$finish;
|
|
end
|
|
|
|
if (AXIS_PCIE_DATA_WIDTH == 512) begin
|
|
if (AXIS_PCIE_RC_USER_WIDTH != 161) begin
|
|
$error("Error: PCIe RC tuser width must be 161 (instance %m)");
|
|
$finish;
|
|
end
|
|
|
|
if (AXIS_PCIE_RQ_USER_WIDTH != 137) begin
|
|
$error("Error: PCIe RQ tuser width must be 137 (instance %m)");
|
|
$finish;
|
|
end
|
|
end else begin
|
|
if (AXIS_PCIE_RC_USER_WIDTH != 75) begin
|
|
$error("Error: PCIe RC tuser width must be 75 (instance %m)");
|
|
$finish;
|
|
end
|
|
|
|
if (AXIS_PCIE_RQ_USER_WIDTH != 60 && AXIS_PCIE_RQ_USER_WIDTH != 62) begin
|
|
$error("Error: PCIe RQ tuser width must be 60 or 62 (instance %m)");
|
|
$finish;
|
|
end
|
|
end
|
|
|
|
if (AXIS_PCIE_RQ_USER_WIDTH == 60) begin
|
|
if (RQ_SEQ_NUM_ENABLE && RQ_SEQ_NUM_WIDTH != 4) begin
|
|
$error("Error: RQ sequence number width must be 4 (instance %m)");
|
|
$finish;
|
|
end
|
|
|
|
if (PCIE_TAG_COUNT > 64) begin
|
|
$error("Error: PCIe tag count must be no larger than 64 (instance %m)");
|
|
$finish;
|
|
end
|
|
end else begin
|
|
if (RQ_SEQ_NUM_ENABLE && RQ_SEQ_NUM_WIDTH != 6) begin
|
|
$error("Error: RQ sequence number width must be 6 (instance %m)");
|
|
$finish;
|
|
end
|
|
|
|
if (PCIE_TAG_COUNT > 256) begin
|
|
$error("Error: PCIe tag count must be no larger than 256 (instance %m)");
|
|
$finish;
|
|
end
|
|
end
|
|
|
|
if (RQ_SEQ_NUM_ENABLE && TX_LIMIT > 2**(RQ_SEQ_NUM_WIDTH-1)) begin
|
|
$error("Error: TX limit out of range (instance %m)");
|
|
$finish;
|
|
end
|
|
|
|
if (SEG_COUNT < 2) begin
|
|
$error("Error: RAM interface requires at least 2 segments (instance %m)");
|
|
$finish;
|
|
end
|
|
|
|
if (SEG_COUNT*SEG_DATA_WIDTH != AXIS_PCIE_DATA_WIDTH*2) begin
|
|
$error("Error: RAM interface width must be double the PCIe interface width (instance %m)");
|
|
$finish;
|
|
end
|
|
|
|
if (SEG_BE_WIDTH * 8 != SEG_DATA_WIDTH) begin
|
|
$error("Error: RAM interface requires byte (8-bit) granularity (instance %m)");
|
|
$finish;
|
|
end
|
|
|
|
if (2**$clog2(RAM_WORD_WIDTH) != RAM_WORD_WIDTH) begin
|
|
$error("Error: RAM word width must be even power of two (instance %m)");
|
|
$finish;
|
|
end
|
|
|
|
if (RAM_ADDR_WIDTH != SEG_ADDR_WIDTH+$clog2(SEG_COUNT)+$clog2(SEG_BE_WIDTH)) begin
|
|
$error("Error: RAM_ADDR_WIDTH does not match RAM configuration (instance %m)");
|
|
$finish;
|
|
end
|
|
|
|
if (PCIE_TAG_COUNT < 1 || PCIE_TAG_COUNT > 256) begin
|
|
$error("Error: PCIe tag count must be between 1 and 256 (instance %m)");
|
|
$finish;
|
|
end
|
|
end
|
|
|
|
localparam [3:0]
|
|
REQ_MEM_READ = 4'b0000,
|
|
REQ_MEM_WRITE = 4'b0001,
|
|
REQ_IO_READ = 4'b0010,
|
|
REQ_IO_WRITE = 4'b0011,
|
|
REQ_MEM_FETCH_ADD = 4'b0100,
|
|
REQ_MEM_SWAP = 4'b0101,
|
|
REQ_MEM_CAS = 4'b0110,
|
|
REQ_MEM_READ_LOCKED = 4'b0111,
|
|
REQ_CFG_READ_0 = 4'b1000,
|
|
REQ_CFG_READ_1 = 4'b1001,
|
|
REQ_CFG_WRITE_0 = 4'b1010,
|
|
REQ_CFG_WRITE_1 = 4'b1011,
|
|
REQ_MSG = 4'b1100,
|
|
REQ_MSG_VENDOR = 4'b1101,
|
|
REQ_MSG_ATS = 4'b1110;
|
|
|
|
localparam [2:0]
|
|
CPL_STATUS_SC = 3'b000, // successful completion
|
|
CPL_STATUS_UR = 3'b001, // unsupported request
|
|
CPL_STATUS_CRS = 3'b010, // configuration request retry status
|
|
CPL_STATUS_CA = 3'b100; // completer abort
|
|
|
|
localparam [3:0]
|
|
RC_ERROR_NORMAL_TERMINATION = 4'b0000,
|
|
RC_ERROR_POISONED = 4'b0001,
|
|
RC_ERROR_BAD_STATUS = 4'b0010,
|
|
RC_ERROR_INVALID_LENGTH = 4'b0011,
|
|
RC_ERROR_MISMATCH = 4'b0100,
|
|
RC_ERROR_INVALID_ADDRESS = 4'b0101,
|
|
RC_ERROR_INVALID_TAG = 4'b0110,
|
|
RC_ERROR_TIMEOUT = 4'b1001,
|
|
RC_ERROR_FLR = 4'b1000;
|
|
|
|
localparam [3:0]
|
|
DMA_ERROR_NONE = 4'd0,
|
|
DMA_ERROR_TIMEOUT = 4'd1,
|
|
DMA_ERROR_PARITY = 4'd2,
|
|
DMA_ERROR_AXI_RD_SLVERR = 4'd4,
|
|
DMA_ERROR_AXI_RD_DECERR = 4'd5,
|
|
DMA_ERROR_AXI_WR_SLVERR = 4'd6,
|
|
DMA_ERROR_AXI_WR_DECERR = 4'd7,
|
|
DMA_ERROR_PCIE_FLR = 4'd8,
|
|
DMA_ERROR_PCIE_CPL_POISONED = 4'd9,
|
|
DMA_ERROR_PCIE_CPL_STATUS_UR = 4'd10,
|
|
DMA_ERROR_PCIE_CPL_STATUS_CA = 4'd11;
|
|
|
|
localparam [1:0]
|
|
REQ_STATE_IDLE = 2'd0,
|
|
REQ_STATE_START = 2'd1,
|
|
REQ_STATE_HEADER = 2'd2;
|
|
|
|
reg [1:0] req_state_reg = REQ_STATE_IDLE, req_state_next;
|
|
|
|
localparam [1:0]
|
|
TLP_STATE_IDLE = 2'd0,
|
|
TLP_STATE_HEADER = 2'd1,
|
|
TLP_STATE_WRITE = 2'd2,
|
|
TLP_STATE_WAIT_END = 2'd3;
|
|
|
|
reg [1:0] tlp_state_reg = TLP_STATE_IDLE, tlp_state_next;
|
|
|
|
// datapath control signals
|
|
reg last_cycle;
|
|
|
|
reg [3:0] first_be;
|
|
reg [3:0] last_be;
|
|
reg [10:0] dword_count;
|
|
reg req_last_tlp;
|
|
reg [PCIE_ADDR_WIDTH-1:0] req_pcie_addr;
|
|
|
|
reg [INIT_COUNT_WIDTH-1:0] init_count_reg = 0;
|
|
reg init_done_reg = 1'b0;
|
|
reg init_pcie_tag_reg = 1'b1;
|
|
reg init_op_tag_reg = 1'b1;
|
|
|
|
reg [PCIE_ADDR_WIDTH-1:0] req_pcie_addr_reg = {PCIE_ADDR_WIDTH{1'b0}}, req_pcie_addr_next;
|
|
reg [RAM_SEL_WIDTH-1:0] req_ram_sel_reg = {RAM_SEL_WIDTH{1'b0}}, req_ram_sel_next;
|
|
reg [RAM_ADDR_WIDTH-1:0] req_ram_addr_reg = {RAM_ADDR_WIDTH{1'b0}}, req_ram_addr_next;
|
|
reg [LEN_WIDTH-1:0] req_op_count_reg = {LEN_WIDTH{1'b0}}, req_op_count_next;
|
|
reg [12:0] req_tlp_count_reg = 13'd0, req_tlp_count_next;
|
|
reg req_zero_len_reg = 1'b0, req_zero_len_next;
|
|
reg [OP_TAG_WIDTH-1:0] req_op_tag_reg = {OP_TAG_WIDTH{1'b0}}, req_op_tag_next;
|
|
reg req_op_tag_valid_reg = 1'b0, req_op_tag_valid_next;
|
|
reg [PCIE_TAG_WIDTH-1:0] req_pcie_tag_reg = {PCIE_TAG_WIDTH{1'b0}}, req_pcie_tag_next;
|
|
reg req_pcie_tag_valid_reg = 1'b0, req_pcie_tag_valid_next;
|
|
|
|
reg [11:0] lower_addr_reg = 12'd0, lower_addr_next;
|
|
reg [12:0] byte_count_reg = 13'd0, byte_count_next;
|
|
reg [3:0] error_code_reg = 4'd0, error_code_next;
|
|
reg [RAM_SEL_WIDTH-1:0] ram_sel_reg = {RAM_SEL_WIDTH{1'b0}}, ram_sel_next;
|
|
reg [RAM_ADDR_WIDTH-1:0] addr_reg = {RAM_ADDR_WIDTH{1'b0}}, addr_next;
|
|
reg [RAM_ADDR_WIDTH-1:0] addr_delay_reg = {RAM_ADDR_WIDTH{1'b0}}, addr_delay_next;
|
|
reg [10:0] op_dword_count_reg = 11'd0, op_dword_count_next;
|
|
reg [12:0] op_count_reg = 13'd0, op_count_next;
|
|
reg zero_len_reg = 1'b0, zero_len_next;
|
|
reg [SEG_COUNT-1:0] ram_mask_reg = {SEG_COUNT{1'b0}}, ram_mask_next;
|
|
reg [SEG_COUNT-1:0] ram_mask_0_reg = {SEG_COUNT{1'b0}}, ram_mask_0_next;
|
|
reg [SEG_COUNT-1:0] ram_mask_1_reg = {SEG_COUNT{1'b0}}, ram_mask_1_next;
|
|
reg ram_wrap_reg = 1'b0, ram_wrap_next;
|
|
reg [OFFSET_WIDTH+1-1:0] cycle_byte_count_reg = {OFFSET_WIDTH+1{1'b0}}, cycle_byte_count_next;
|
|
reg [RAM_OFFSET_WIDTH-1:0] start_offset_reg = {RAM_OFFSET_WIDTH{1'b0}}, start_offset_next;
|
|
reg [RAM_OFFSET_WIDTH-1:0] end_offset_reg = {RAM_OFFSET_WIDTH{1'b0}}, end_offset_next;
|
|
reg [2:0] cpl_status_reg = 3'b000, cpl_status_next;
|
|
reg [PCIE_TAG_WIDTH-1:0] pcie_tag_reg = {PCIE_TAG_WIDTH{1'b0}}, pcie_tag_next;
|
|
reg [OP_TAG_WIDTH-1:0] op_tag_reg = {OP_TAG_WIDTH{1'b0}}, op_tag_next;
|
|
reg final_cpl_reg = 1'b0, final_cpl_next;
|
|
reg finish_tag_reg = 1'b0, finish_tag_next;
|
|
|
|
reg [OFFSET_WIDTH-1:0] offset_reg = {OFFSET_WIDTH{1'b0}}, offset_next;
|
|
|
|
reg [AXIS_PCIE_DATA_WIDTH-1:0] rc_tdata_int_reg = {AXIS_PCIE_DATA_WIDTH{1'b0}}, rc_tdata_int_next;
|
|
reg rc_tvalid_int_reg = 1'b0, rc_tvalid_int_next;
|
|
|
|
reg [127:0] tlp_header_data;
|
|
reg [AXIS_PCIE_RQ_USER_WIDTH-1:0] tlp_tuser;
|
|
|
|
reg [10:0] max_read_request_size_dw_reg = 11'd0;
|
|
|
|
reg have_credit_reg = 1'b0;
|
|
|
|
reg [STATUS_FIFO_ADDR_WIDTH+1-1:0] status_fifo_wr_ptr_reg = 0;
|
|
reg [STATUS_FIFO_ADDR_WIDTH+1-1:0] status_fifo_rd_ptr_reg = 0;
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg [OP_TAG_WIDTH-1:0] status_fifo_op_tag[(2**STATUS_FIFO_ADDR_WIDTH)-1:0];
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg [SEG_COUNT-1:0] status_fifo_mask[(2**STATUS_FIFO_ADDR_WIDTH)-1:0];
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg status_fifo_finish[(2**STATUS_FIFO_ADDR_WIDTH)-1:0];
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg [3:0] status_fifo_error[(2**STATUS_FIFO_ADDR_WIDTH)-1:0];
|
|
reg [OP_TAG_WIDTH-1:0] status_fifo_wr_op_tag;
|
|
reg [SEG_COUNT-1:0] status_fifo_wr_mask;
|
|
reg status_fifo_wr_finish;
|
|
reg [3:0] status_fifo_wr_error;
|
|
reg status_fifo_wr_en;
|
|
reg status_fifo_mask_reg = 1'b0, status_fifo_mask_next;
|
|
reg status_fifo_finish_reg = 1'b0, status_fifo_finish_next;
|
|
reg [3:0] status_fifo_error_reg = 4'd0, status_fifo_error_next;
|
|
reg status_fifo_wr_en_reg = 1'b0, status_fifo_wr_en_next;
|
|
reg status_fifo_half_full_reg = 1'b0;
|
|
reg status_fifo_rd_en;
|
|
reg [OP_TAG_WIDTH-1:0] status_fifo_rd_op_tag_reg = 0;
|
|
reg [SEG_COUNT-1:0] status_fifo_rd_mask_reg = 0;
|
|
reg status_fifo_rd_finish_reg = 1'b0;
|
|
reg [3:0] status_fifo_rd_error_reg = 4'd0;
|
|
reg status_fifo_rd_valid_reg = 1'b0, status_fifo_rd_valid_next;
|
|
|
|
reg [RQ_SEQ_NUM_WIDTH-1:0] active_tx_count_reg = {RQ_SEQ_NUM_WIDTH{1'b0}};
|
|
reg active_tx_count_av_reg = 1'b1;
|
|
reg inc_active_tx;
|
|
|
|
reg s_axis_rc_tready_reg = 1'b0, s_axis_rc_tready_next;
|
|
reg s_axis_read_desc_ready_reg = 1'b0, s_axis_read_desc_ready_next;
|
|
|
|
reg [TAG_WIDTH-1:0] m_axis_read_desc_status_tag_reg = {TAG_WIDTH{1'b0}}, m_axis_read_desc_status_tag_next;
|
|
reg [3:0] m_axis_read_desc_status_error_reg = 4'd0, m_axis_read_desc_status_error_next;
|
|
reg m_axis_read_desc_status_valid_reg = 1'b0, m_axis_read_desc_status_valid_next;
|
|
|
|
reg status_error_cor_reg = 1'b0, status_error_cor_next;
|
|
reg status_error_uncor_reg = 1'b0, status_error_uncor_next;
|
|
|
|
// internal datapath
|
|
reg [AXIS_PCIE_DATA_WIDTH-1:0] m_axis_rq_tdata_int;
|
|
reg [AXIS_PCIE_KEEP_WIDTH-1:0] m_axis_rq_tkeep_int;
|
|
reg m_axis_rq_tvalid_int;
|
|
reg m_axis_rq_tready_int_reg = 1'b0;
|
|
reg m_axis_rq_tlast_int;
|
|
reg [AXIS_PCIE_RQ_USER_WIDTH-1:0] m_axis_rq_tuser_int;
|
|
wire m_axis_rq_tready_int_early;
|
|
|
|
reg [SEG_COUNT*RAM_SEL_WIDTH-1:0] ram_wr_cmd_sel_int;
|
|
reg [SEG_COUNT*SEG_BE_WIDTH-1:0] ram_wr_cmd_be_int;
|
|
reg [SEG_COUNT*SEG_ADDR_WIDTH-1:0] ram_wr_cmd_addr_int;
|
|
reg [SEG_COUNT*SEG_DATA_WIDTH-1:0] ram_wr_cmd_data_int;
|
|
reg [SEG_COUNT-1:0] ram_wr_cmd_valid_int;
|
|
wire [SEG_COUNT-1:0] ram_wr_cmd_ready_int;
|
|
|
|
wire [SEG_COUNT-1:0] out_done;
|
|
reg [SEG_COUNT-1:0] out_done_ack;
|
|
|
|
assign s_axis_rc_tready = s_axis_rc_tready_reg;
|
|
assign s_axis_read_desc_ready = s_axis_read_desc_ready_reg;
|
|
|
|
assign m_axis_read_desc_status_tag = m_axis_read_desc_status_tag_reg;
|
|
assign m_axis_read_desc_status_error = m_axis_read_desc_status_error_reg;
|
|
assign m_axis_read_desc_status_valid = m_axis_read_desc_status_valid_reg;
|
|
|
|
assign status_error_cor = status_error_cor_reg;
|
|
assign status_error_uncor = status_error_uncor_reg;
|
|
|
|
// PCIe tag management
|
|
reg [PCIE_TAG_WIDTH-1:0] pcie_tag_table_start_ptr_reg = 0, pcie_tag_table_start_ptr_next;
|
|
reg [RAM_SEL_WIDTH-1:0] pcie_tag_table_start_ram_sel_reg = 0, pcie_tag_table_start_ram_sel_next;
|
|
reg [RAM_ADDR_WIDTH-1:0] pcie_tag_table_start_ram_addr_reg = 0, pcie_tag_table_start_ram_addr_next;
|
|
reg [OP_TAG_WIDTH-1:0] pcie_tag_table_start_op_tag_reg = 0, pcie_tag_table_start_op_tag_next;
|
|
reg pcie_tag_table_start_zero_len_reg = 1'b0, pcie_tag_table_start_zero_len_next;
|
|
reg pcie_tag_table_start_en_reg = 1'b0, pcie_tag_table_start_en_next;
|
|
reg [PCIE_TAG_WIDTH-1:0] pcie_tag_table_finish_ptr;
|
|
reg pcie_tag_table_finish_en;
|
|
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg [RAM_SEL_WIDTH-1:0] pcie_tag_table_ram_sel[(2**PCIE_TAG_WIDTH)-1:0];
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg [RAM_ADDR_WIDTH-1:0] pcie_tag_table_ram_addr[(2**PCIE_TAG_WIDTH)-1:0];
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg [OP_TAG_WIDTH-1:0] pcie_tag_table_op_tag[(2**PCIE_TAG_WIDTH)-1:0];
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg pcie_tag_table_zero_len[(2**PCIE_TAG_WIDTH)-1:0];
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg pcie_tag_table_active_a[(2**PCIE_TAG_WIDTH)-1:0];
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg pcie_tag_table_active_b[(2**PCIE_TAG_WIDTH)-1:0];
|
|
|
|
reg [PCIE_TAG_WIDTH-1:0] pcie_tag_fifo_wr_tag;
|
|
|
|
reg [PCIE_TAG_WIDTH_1+1-1:0] pcie_tag_fifo_1_wr_ptr_reg = 0;
|
|
reg [PCIE_TAG_WIDTH_1+1-1:0] pcie_tag_fifo_1_rd_ptr_reg = 0, pcie_tag_fifo_1_rd_ptr_next;
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg [PCIE_TAG_WIDTH_1-1:0] pcie_tag_fifo_1_mem [2**PCIE_TAG_WIDTH_1-1:0];
|
|
reg pcie_tag_fifo_1_we;
|
|
|
|
reg [PCIE_TAG_WIDTH_2+1-1:0] pcie_tag_fifo_2_wr_ptr_reg = 0;
|
|
reg [PCIE_TAG_WIDTH_2+1-1:0] pcie_tag_fifo_2_rd_ptr_reg = 0, pcie_tag_fifo_2_rd_ptr_next;
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg [PCIE_TAG_WIDTH-1:0] pcie_tag_fifo_2_mem [2**PCIE_TAG_WIDTH_2-1:0];
|
|
reg pcie_tag_fifo_2_we;
|
|
|
|
// operation tag management
|
|
reg [OP_TAG_WIDTH-1:0] op_table_start_ptr;
|
|
reg [TAG_WIDTH-1:0] op_table_start_tag;
|
|
reg op_table_start_en;
|
|
reg [OP_TAG_WIDTH-1:0] op_table_read_start_ptr;
|
|
reg op_table_read_start_commit;
|
|
reg op_table_read_start_en;
|
|
reg [OP_TAG_WIDTH-1:0] op_table_update_status_ptr;
|
|
reg [3:0] op_table_update_status_error;
|
|
reg op_table_update_status_en;
|
|
reg [OP_TAG_WIDTH-1:0] op_table_read_finish_ptr;
|
|
reg op_table_read_finish_en;
|
|
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg [TAG_WIDTH-1:0] op_table_tag [2**OP_TAG_WIDTH-1:0];
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg op_table_read_init_a [2**OP_TAG_WIDTH-1:0];
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg op_table_read_init_b [2**OP_TAG_WIDTH-1:0];
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg op_table_read_commit [2**OP_TAG_WIDTH-1:0];
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg [OP_TABLE_READ_COUNT_WIDTH-1:0] op_table_read_count_start [2**OP_TAG_WIDTH-1:0];
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg [OP_TABLE_READ_COUNT_WIDTH-1:0] op_table_read_count_finish [2**OP_TAG_WIDTH-1:0];
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg op_table_error_a [2**OP_TAG_WIDTH-1:0];
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg op_table_error_b [2**OP_TAG_WIDTH-1:0];
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg [3:0] op_table_error_code [2**OP_TAG_WIDTH-1:0];
|
|
|
|
reg [OP_TAG_WIDTH+1-1:0] op_tag_fifo_wr_ptr_reg = 0;
|
|
reg [OP_TAG_WIDTH+1-1:0] op_tag_fifo_rd_ptr_reg = 0, op_tag_fifo_rd_ptr_next;
|
|
(* ram_style = "distributed", ramstyle = "no_rw_check, mlab" *)
|
|
reg [OP_TAG_WIDTH-1:0] op_tag_fifo_mem [2**OP_TAG_WIDTH-1:0];
|
|
reg [OP_TAG_WIDTH-1:0] op_tag_fifo_wr_tag;
|
|
reg op_tag_fifo_we;
|
|
|
|
integer i;
|
|
|
|
initial begin
|
|
for (i = 0; i < 2**OP_TAG_WIDTH; i = i + 1) begin
|
|
op_table_tag[i] = 0;
|
|
op_table_read_init_a[i] = 0;
|
|
op_table_read_init_b[i] = 0;
|
|
op_table_read_commit[i] = 0;
|
|
op_table_read_count_start[i] = 0;
|
|
op_table_read_count_finish[i] = 0;
|
|
op_table_error_a[i] = 0;
|
|
op_table_error_b[i] = 0;
|
|
op_table_error_code[i] = 0;
|
|
end
|
|
|
|
for (i = 0; i < 2**PCIE_TAG_WIDTH; i = i + 1) begin
|
|
pcie_tag_table_ram_sel[i] = 0;
|
|
pcie_tag_table_ram_addr[i] = 0;
|
|
pcie_tag_table_op_tag[i] = 0;
|
|
pcie_tag_table_zero_len[i] = 0;
|
|
pcie_tag_table_active_a[i] = 0;
|
|
pcie_tag_table_active_b[i] = 0;
|
|
end
|
|
end
|
|
|
|
always @* begin
|
|
req_state_next = REQ_STATE_IDLE;
|
|
|
|
s_axis_read_desc_ready_next = 1'b0;
|
|
|
|
req_pcie_addr_next = req_pcie_addr_reg;
|
|
req_ram_sel_next = req_ram_sel_reg;
|
|
req_ram_addr_next = req_ram_addr_reg;
|
|
req_op_count_next = req_op_count_reg;
|
|
req_tlp_count_next = req_tlp_count_reg;
|
|
req_zero_len_next = req_zero_len_reg;
|
|
req_op_tag_next = req_op_tag_reg;
|
|
req_op_tag_valid_next = req_op_tag_valid_reg;
|
|
req_pcie_tag_next = req_pcie_tag_reg;
|
|
req_pcie_tag_valid_next = req_pcie_tag_valid_reg;
|
|
|
|
inc_active_tx = 1'b0;
|
|
|
|
op_table_start_ptr = req_op_tag_reg;
|
|
op_table_start_tag = s_axis_read_desc_tag;
|
|
op_table_start_en = 1'b0;
|
|
|
|
op_table_read_start_ptr = req_op_tag_reg;
|
|
op_table_read_start_commit = 1'b0;
|
|
op_table_read_start_en = 1'b0;
|
|
|
|
// TLP size computation
|
|
if (req_op_count_reg + req_pcie_addr_reg[1:0] <= {max_read_request_size_dw_reg, 2'b00}) begin
|
|
// packet smaller than max read request size
|
|
if (((req_pcie_addr_reg & 12'hfff) + (req_op_count_reg & 12'hfff)) >> 12 != 0 || req_op_count_reg >> 12 != 0) begin
|
|
// crosses 4k boundary, split on 4K boundary
|
|
req_tlp_count_next = 13'h1000 - req_pcie_addr_reg[11:0];
|
|
dword_count = 11'h400 - req_pcie_addr_reg[11:2];
|
|
req_last_tlp = (((req_pcie_addr_reg & 12'hfff) + (req_op_count_reg & 12'hfff)) & 12'hfff) == 0 && req_op_count_reg >> 12 == 0;
|
|
// optimized req_pcie_addr = req_pcie_addr_reg + req_tlp_count_next
|
|
req_pcie_addr[PCIE_ADDR_WIDTH-1:12] = req_pcie_addr_reg[PCIE_ADDR_WIDTH-1:12]+1;
|
|
req_pcie_addr[11:0] = 12'd0;
|
|
end else begin
|
|
// does not cross 4k boundary, send one TLP
|
|
req_tlp_count_next = req_op_count_reg;
|
|
dword_count = (req_op_count_reg + req_pcie_addr_reg[1:0] + 3) >> 2;
|
|
req_last_tlp = 1'b1;
|
|
// always last TLP, so next address is irrelevant
|
|
req_pcie_addr[PCIE_ADDR_WIDTH-1:12] = req_pcie_addr_reg[PCIE_ADDR_WIDTH-1:12];
|
|
req_pcie_addr[11:0] = 12'd0;
|
|
end
|
|
end else begin
|
|
// packet larger than max read request size
|
|
if (((req_pcie_addr_reg & 12'hfff) + {max_read_request_size_dw_reg, 2'b00}) >> 12 != 0) begin
|
|
// crosses 4k boundary, split on 4K boundary
|
|
req_tlp_count_next = 13'h1000 - req_pcie_addr_reg[11:0];
|
|
dword_count = 11'h400 - req_pcie_addr_reg[11:2];
|
|
req_last_tlp = 1'b0;
|
|
// optimized req_pcie_addr = req_pcie_addr_reg + req_tlp_count_next
|
|
req_pcie_addr[PCIE_ADDR_WIDTH-1:12] = req_pcie_addr_reg[PCIE_ADDR_WIDTH-1:12]+1;
|
|
req_pcie_addr[11:0] = 12'd0;
|
|
end else begin
|
|
// does not cross 4k boundary, split on 128-byte read completion boundary
|
|
req_tlp_count_next = {max_read_request_size_dw_reg, 2'b00} - req_pcie_addr_reg[6:0];
|
|
dword_count = max_read_request_size_dw_reg - req_pcie_addr_reg[6:2];
|
|
req_last_tlp = 1'b0;
|
|
// optimized req_pcie_addr = req_pcie_addr_reg + req_tlp_count_next
|
|
req_pcie_addr[PCIE_ADDR_WIDTH-1:12] = req_pcie_addr_reg[PCIE_ADDR_WIDTH-1:12];
|
|
req_pcie_addr[11:0] = {{req_pcie_addr_reg[11:7], 5'd0} + max_read_request_size_dw_reg, 2'b00};
|
|
end
|
|
end
|
|
|
|
pcie_tag_table_start_ptr_next = req_pcie_tag_reg;
|
|
pcie_tag_table_start_ram_sel_next = req_ram_sel_reg;
|
|
pcie_tag_table_start_ram_addr_next = req_ram_addr_reg + req_tlp_count_next;
|
|
pcie_tag_table_start_op_tag_next = req_op_tag_reg;
|
|
pcie_tag_table_start_zero_len_next = req_zero_len_reg;
|
|
pcie_tag_table_start_en_next = 1'b0;
|
|
|
|
first_be = 4'b1111 << req_pcie_addr_reg[1:0];
|
|
last_be = 4'b1111 >> (3 - ((req_pcie_addr_reg[1:0] + req_tlp_count_next[1:0] - 1) & 3));
|
|
|
|
// TLP header and sideband data
|
|
tlp_header_data[1:0] = 2'b0; // address type
|
|
tlp_header_data[63:2] = req_pcie_addr_reg[PCIE_ADDR_WIDTH-1:2]; // address
|
|
tlp_header_data[74:64] = dword_count; // DWORD count
|
|
tlp_header_data[78:75] = REQ_MEM_READ; // request type - memory read
|
|
tlp_header_data[79] = 1'b0; // poisoned request
|
|
tlp_header_data[95:80] = requester_id;
|
|
tlp_header_data[103:96] = req_pcie_tag_reg;
|
|
tlp_header_data[119:104] = 16'd0; // completer ID
|
|
tlp_header_data[120] = requester_id_enable;
|
|
tlp_header_data[123:121] = 3'b000; // traffic class
|
|
tlp_header_data[126:124] = 3'b000; // attr
|
|
tlp_header_data[127] = 1'b0; // force ECRC
|
|
|
|
if (AXIS_PCIE_DATA_WIDTH == 512) begin
|
|
tlp_tuser[3:0] = req_zero_len_reg ? 4'b0000 : (dword_count == 1 ? first_be & last_be : first_be); // first BE 0
|
|
tlp_tuser[7:4] = 4'd0; // first BE 1
|
|
tlp_tuser[11:8] = req_zero_len_reg ? 4'b0000 : (dword_count == 1 ? 4'b0000 : last_be); // last BE 0
|
|
tlp_tuser[15:12] = 4'd0; // last BE 1
|
|
tlp_tuser[19:16] = 3'd0; // addr_offset
|
|
tlp_tuser[21:20] = 2'b01; // is_sop
|
|
tlp_tuser[23:22] = 2'd0; // is_sop0_ptr
|
|
tlp_tuser[25:24] = 2'd0; // is_sop1_ptr
|
|
tlp_tuser[27:26] = 2'b01; // is_eop
|
|
tlp_tuser[31:28] = 4'd3; // is_eop0_ptr
|
|
tlp_tuser[35:32] = 4'd0; // is_eop1_ptr
|
|
tlp_tuser[36] = 1'b0; // discontinue
|
|
tlp_tuser[38:37] = 2'b00; // tph_present
|
|
tlp_tuser[42:39] = 4'b0000; // tph_type
|
|
tlp_tuser[44:43] = 2'b00; // tph_indirect_tag_en
|
|
tlp_tuser[60:45] = 16'd0; // tph_st_tag
|
|
tlp_tuser[66:61] = 6'd0; // seq_num0
|
|
tlp_tuser[72:67] = 6'd0; // seq_num1
|
|
tlp_tuser[136:73] = 64'd0; // parity
|
|
end else begin
|
|
tlp_tuser[3:0] = req_zero_len_reg ? 4'b0000 : (dword_count == 1 ? first_be & last_be : first_be); // first BE
|
|
tlp_tuser[7:4] = req_zero_len_reg ? 4'b0000 : (dword_count == 1 ? 4'b0000 : last_be); // last BE
|
|
tlp_tuser[10:8] = 3'd0; // addr_offset
|
|
tlp_tuser[11] = 1'b0; // discontinue
|
|
tlp_tuser[12] = 1'b0; // tph_present
|
|
tlp_tuser[14:13] = 2'b00; // tph_type
|
|
tlp_tuser[15] = 1'b0; // tph_indirect_tag_en
|
|
tlp_tuser[23:16] = 8'd0; // tph_st_tag
|
|
tlp_tuser[27:24] = 4'd0; // seq_num
|
|
tlp_tuser[59:28] = 32'd0; // parity
|
|
if (AXIS_PCIE_RQ_USER_WIDTH == 62) begin
|
|
tlp_tuser[61:60] = 2'd0; // seq_num
|
|
end
|
|
end
|
|
|
|
if (AXIS_PCIE_DATA_WIDTH == 512) begin
|
|
m_axis_rq_tdata_int = tlp_header_data;
|
|
m_axis_rq_tkeep_int = 16'b0000000000001111;
|
|
m_axis_rq_tlast_int = 1'b1;
|
|
end else if (AXIS_PCIE_DATA_WIDTH == 256) begin
|
|
m_axis_rq_tdata_int = tlp_header_data;
|
|
m_axis_rq_tkeep_int = 8'b00001111;
|
|
m_axis_rq_tlast_int = 1'b1;
|
|
end else if (AXIS_PCIE_DATA_WIDTH == 128) begin
|
|
m_axis_rq_tdata_int = tlp_header_data;
|
|
m_axis_rq_tkeep_int = 4'b1111;
|
|
m_axis_rq_tlast_int = 1'b1;
|
|
end else if (AXIS_PCIE_DATA_WIDTH == 64) begin
|
|
m_axis_rq_tdata_int = tlp_header_data[63:0];
|
|
m_axis_rq_tkeep_int = 2'b11;
|
|
m_axis_rq_tlast_int = 1'b0;
|
|
end
|
|
m_axis_rq_tvalid_int = 1'b0;
|
|
m_axis_rq_tuser_int = tlp_tuser;
|
|
|
|
// TLP segmentation and request generation
|
|
case (req_state_reg)
|
|
REQ_STATE_IDLE: begin
|
|
s_axis_read_desc_ready_next = init_done_reg && enable && req_op_tag_valid_reg;
|
|
|
|
if (s_axis_read_desc_ready && s_axis_read_desc_valid) begin
|
|
s_axis_read_desc_ready_next = 1'b0;
|
|
req_ram_sel_next = s_axis_read_desc_ram_sel;
|
|
req_pcie_addr_next = s_axis_read_desc_pcie_addr;
|
|
req_ram_addr_next = s_axis_read_desc_ram_addr;
|
|
if (s_axis_read_desc_len == 0) begin
|
|
// zero-length operation
|
|
req_op_count_next = 1;
|
|
req_zero_len_next = 1'b1;
|
|
end else begin
|
|
req_op_count_next = s_axis_read_desc_len;
|
|
req_zero_len_next = 1'b0;
|
|
end
|
|
op_table_start_ptr = req_op_tag_reg;
|
|
op_table_start_tag = s_axis_read_desc_tag;
|
|
op_table_start_en = 1'b1;
|
|
req_state_next = REQ_STATE_START;
|
|
end else begin
|
|
req_state_next = REQ_STATE_IDLE;
|
|
end
|
|
end
|
|
REQ_STATE_START: begin
|
|
if (m_axis_rq_tready_int_reg && req_pcie_tag_valid_reg && (!TX_FC_ENABLE || have_credit_reg) && (!RQ_SEQ_NUM_ENABLE || active_tx_count_av_reg)) begin
|
|
m_axis_rq_tvalid_int = 1'b1;
|
|
|
|
inc_active_tx = 1'b1;
|
|
|
|
if (AXIS_PCIE_DATA_WIDTH > 64) begin
|
|
req_pcie_addr_next = req_pcie_addr;
|
|
req_ram_addr_next = req_ram_addr_reg + req_tlp_count_next;
|
|
req_op_count_next = req_op_count_reg - req_tlp_count_next;
|
|
|
|
pcie_tag_table_start_ptr_next = req_pcie_tag_reg;
|
|
pcie_tag_table_start_ram_sel_next = req_ram_sel_reg;
|
|
pcie_tag_table_start_ram_addr_next = req_ram_addr_reg + req_tlp_count_next;
|
|
pcie_tag_table_start_op_tag_next = req_op_tag_reg;
|
|
pcie_tag_table_start_zero_len_next = req_zero_len_reg;
|
|
pcie_tag_table_start_en_next = 1'b1;
|
|
|
|
op_table_read_start_ptr = req_op_tag_reg;
|
|
op_table_read_start_commit = req_last_tlp;
|
|
op_table_read_start_en = 1'b1;
|
|
|
|
req_pcie_tag_valid_next = 1'b0;
|
|
|
|
if (!req_last_tlp) begin
|
|
req_state_next = REQ_STATE_START;
|
|
end else begin
|
|
req_op_tag_valid_next = 1'b0;
|
|
s_axis_read_desc_ready_next = init_done_reg && enable && (op_tag_fifo_rd_ptr_reg != op_tag_fifo_wr_ptr_reg);
|
|
req_state_next = REQ_STATE_IDLE;
|
|
end
|
|
end else begin
|
|
req_state_next = REQ_STATE_HEADER;
|
|
end
|
|
end else begin
|
|
req_state_next = REQ_STATE_START;
|
|
end
|
|
end
|
|
REQ_STATE_HEADER: begin
|
|
if (AXIS_PCIE_DATA_WIDTH == 64) begin
|
|
m_axis_rq_tdata_int = tlp_header_data[127:64];
|
|
m_axis_rq_tkeep_int = 2'b11;
|
|
m_axis_rq_tlast_int = 1'b1;
|
|
|
|
if (m_axis_rq_tready_int_reg && req_pcie_tag_valid_reg) begin
|
|
req_pcie_addr_next = req_pcie_addr;
|
|
req_ram_addr_next = req_ram_addr_reg + req_tlp_count_next;
|
|
req_op_count_next = req_op_count_reg - req_tlp_count_next;
|
|
|
|
m_axis_rq_tvalid_int = 1'b1;
|
|
|
|
pcie_tag_table_start_ptr_next = req_pcie_tag_reg;
|
|
pcie_tag_table_start_ram_sel_next = req_ram_sel_reg;
|
|
pcie_tag_table_start_ram_addr_next = req_ram_addr_reg + req_tlp_count_next;
|
|
pcie_tag_table_start_op_tag_next = req_op_tag_reg;
|
|
pcie_tag_table_start_zero_len_next = req_zero_len_reg;
|
|
pcie_tag_table_start_en_next = 1'b1;
|
|
|
|
op_table_read_start_ptr = req_op_tag_reg;
|
|
op_table_read_start_commit = req_last_tlp;
|
|
op_table_read_start_en = 1'b1;
|
|
|
|
req_pcie_tag_valid_next = 1'b0;
|
|
|
|
if (!req_last_tlp) begin
|
|
req_state_next = REQ_STATE_START;
|
|
end else begin
|
|
req_op_tag_valid_next = 1'b0;
|
|
s_axis_read_desc_ready_next = init_done_reg && enable && (op_tag_fifo_rd_ptr_reg != op_tag_fifo_wr_ptr_reg);
|
|
req_state_next = REQ_STATE_IDLE;
|
|
end
|
|
end else begin
|
|
req_state_next = REQ_STATE_HEADER;
|
|
end
|
|
end
|
|
end
|
|
endcase
|
|
|
|
op_tag_fifo_rd_ptr_next = op_tag_fifo_rd_ptr_reg;
|
|
|
|
if (!req_op_tag_valid_next) begin
|
|
if (op_tag_fifo_rd_ptr_reg != op_tag_fifo_wr_ptr_reg) begin
|
|
req_op_tag_next = op_tag_fifo_mem[op_tag_fifo_rd_ptr_reg[OP_TAG_WIDTH-1:0]];
|
|
req_op_tag_valid_next = 1'b1;
|
|
op_tag_fifo_rd_ptr_next = op_tag_fifo_rd_ptr_reg + 1;
|
|
end
|
|
end
|
|
|
|
pcie_tag_fifo_1_rd_ptr_next = pcie_tag_fifo_1_rd_ptr_reg;
|
|
pcie_tag_fifo_2_rd_ptr_next = pcie_tag_fifo_2_rd_ptr_reg;
|
|
|
|
if (!req_pcie_tag_valid_next) begin
|
|
if (pcie_tag_fifo_1_rd_ptr_reg != pcie_tag_fifo_1_wr_ptr_reg) begin
|
|
req_pcie_tag_next = pcie_tag_fifo_1_mem[pcie_tag_fifo_1_rd_ptr_reg[PCIE_TAG_WIDTH_1-1:0]];
|
|
req_pcie_tag_valid_next = 1'b1;
|
|
pcie_tag_fifo_1_rd_ptr_next = pcie_tag_fifo_1_rd_ptr_reg + 1;
|
|
end else if (PCIE_TAG_COUNT_2 > 0 && ext_tag_enable && pcie_tag_fifo_2_rd_ptr_reg != pcie_tag_fifo_2_wr_ptr_reg) begin
|
|
req_pcie_tag_next = pcie_tag_fifo_2_mem[pcie_tag_fifo_2_rd_ptr_reg[PCIE_TAG_WIDTH_2-1:0]];
|
|
req_pcie_tag_valid_next = 1'b1;
|
|
pcie_tag_fifo_2_rd_ptr_next = pcie_tag_fifo_2_rd_ptr_reg + 1;
|
|
end
|
|
end
|
|
end
|
|
|
|
always @* begin
|
|
tlp_state_next = TLP_STATE_IDLE;
|
|
|
|
last_cycle = 1'b0;
|
|
|
|
s_axis_rc_tready_next = 1'b0;
|
|
|
|
lower_addr_next = lower_addr_reg;
|
|
byte_count_next = byte_count_reg;
|
|
error_code_next = error_code_reg;
|
|
ram_sel_next = ram_sel_reg;
|
|
addr_next = addr_reg;
|
|
addr_delay_next = addr_delay_reg;
|
|
op_count_next = op_count_reg;
|
|
zero_len_next = zero_len_reg;
|
|
ram_mask_next = ram_mask_reg;
|
|
ram_mask_0_next = ram_mask_0_reg;
|
|
ram_mask_1_next = ram_mask_1_reg;
|
|
ram_wrap_next = ram_wrap_reg;
|
|
cycle_byte_count_next = cycle_byte_count_reg;
|
|
start_offset_next = start_offset_reg;
|
|
end_offset_next = end_offset_reg;
|
|
op_dword_count_next = op_dword_count_reg;
|
|
cpl_status_next = cpl_status_reg;
|
|
pcie_tag_next = pcie_tag_reg;
|
|
op_tag_next = op_tag_reg;
|
|
final_cpl_next = final_cpl_reg;
|
|
finish_tag_next = 1'b0;
|
|
offset_next = offset_reg;
|
|
|
|
rc_tdata_int_next = s_axis_rc_tdata;
|
|
rc_tvalid_int_next = 1'b0;
|
|
|
|
status_fifo_mask_next = 1'b1;
|
|
status_fifo_finish_next = 1'b0;
|
|
status_fifo_error_next = DMA_ERROR_NONE;
|
|
status_fifo_wr_en_next = 1'b0;
|
|
|
|
out_done_ack = {SEG_COUNT{1'b0}};
|
|
|
|
// Write generation
|
|
ram_wr_cmd_sel_int = {SEG_COUNT{ram_sel_reg}};
|
|
if (!ram_wrap_reg) begin
|
|
ram_wr_cmd_be_int = ({SEG_COUNT*SEG_BE_WIDTH{1'b1}} << start_offset_reg) & ({SEG_COUNT*SEG_BE_WIDTH{1'b1}} >> (SEG_COUNT*SEG_BE_WIDTH-1-end_offset_reg));
|
|
end else begin
|
|
ram_wr_cmd_be_int = ({SEG_COUNT*SEG_BE_WIDTH{1'b1}} << start_offset_reg) | ({SEG_COUNT*SEG_BE_WIDTH{1'b1}} >> (SEG_COUNT*SEG_BE_WIDTH-1-end_offset_reg));
|
|
end
|
|
for (i = 0; i < SEG_COUNT; i = i + 1) begin
|
|
ram_wr_cmd_addr_int[i*SEG_ADDR_WIDTH +: SEG_ADDR_WIDTH] = addr_delay_reg[RAM_ADDR_WIDTH-1:RAM_ADDR_WIDTH-SEG_ADDR_WIDTH];
|
|
if (ram_mask_1_reg[i]) begin
|
|
ram_wr_cmd_addr_int[i*SEG_ADDR_WIDTH +: SEG_ADDR_WIDTH] = addr_delay_reg[RAM_ADDR_WIDTH-1:RAM_ADDR_WIDTH-SEG_ADDR_WIDTH]+1;
|
|
end
|
|
end
|
|
ram_wr_cmd_data_int = {3{rc_tdata_int_reg}} >> (AXIS_PCIE_DATA_WIDTH - offset_reg*8);
|
|
ram_wr_cmd_valid_int = {SEG_COUNT{1'b0}};
|
|
|
|
if (rc_tvalid_int_reg) begin
|
|
ram_wr_cmd_valid_int = ram_mask_reg;
|
|
end
|
|
|
|
status_error_cor_next = 1'b0;
|
|
status_error_uncor_next = 1'b0;
|
|
|
|
// TLP response handling
|
|
case (tlp_state_reg)
|
|
TLP_STATE_IDLE: begin
|
|
// idle state, wait for completion
|
|
if (AXIS_PCIE_DATA_WIDTH > 64) begin
|
|
s_axis_rc_tready_next = init_done_reg && &ram_wr_cmd_ready_int && !status_fifo_half_full_reg;
|
|
|
|
if (s_axis_rc_tready && s_axis_rc_tvalid) begin
|
|
// header fields
|
|
lower_addr_next = s_axis_rc_tdata[11:0]; // lower address
|
|
error_code_next = s_axis_rc_tdata[15:12]; // error code
|
|
byte_count_next = s_axis_rc_tdata[28:16]; // byte count
|
|
//s_axis_rc_tdata[29]; // locked read
|
|
//s_axis_rc_tdata[30]; // request completed
|
|
op_dword_count_next = s_axis_rc_tdata[42:32]; // DWORD count
|
|
cpl_status_next = s_axis_rc_tdata[45:43]; // completion status
|
|
//s_axis_rc_tdata[46]; // poisoned completion
|
|
//s_axis_rc_tdata[63:48]; // requester ID
|
|
pcie_tag_next = s_axis_rc_tdata[71:64]; // tag
|
|
//s_axis_rc_tdata[87:72]; // completer ID
|
|
//s_axis_rc_tdata[91:89]; // tc
|
|
//s_axis_rc_tdata[94:92]; // attr
|
|
|
|
// tuser fields
|
|
//s_axis_rc_tuser[31:0]; // byte enables
|
|
//s_axis_rc_tuser[32]; // is_sof_0
|
|
//s_axis_rc_tuser[33]; // is_sof_1
|
|
//s_axis_rc_tuser[37:34]; // is_eof_0
|
|
//s_axis_rc_tuser[41:38]; // is_eof_1
|
|
//s_axis_rc_tuser[42]; // discontinue
|
|
//s_axis_rc_tuser[74:43]; // parity
|
|
|
|
ram_sel_next = pcie_tag_table_ram_sel[pcie_tag_next];
|
|
addr_next = pcie_tag_table_ram_addr[pcie_tag_next] - byte_count_next;
|
|
zero_len_next = pcie_tag_table_zero_len[pcie_tag_next];
|
|
|
|
offset_next = addr_next[OFFSET_WIDTH-1:0] - (12+lower_addr_next[1:0]);
|
|
|
|
if (byte_count_next > (op_dword_count_next << 2) - lower_addr_next[1:0]) begin
|
|
// more completions to follow
|
|
op_count_next = (op_dword_count_next << 2) - lower_addr_next[1:0];
|
|
final_cpl_next = 1'b0;
|
|
|
|
if (op_dword_count_next > (AXIS_PCIE_DATA_WIDTH/32-3)) begin
|
|
// more than one cycle
|
|
cycle_byte_count_next = (AXIS_PCIE_DATA_WIDTH/8-12)-lower_addr_next[1:0];
|
|
last_cycle = 1'b0;
|
|
|
|
start_offset_next = addr_next;
|
|
{ram_wrap_next, end_offset_next} = start_offset_next+cycle_byte_count_next-1;
|
|
end else begin
|
|
// one cycle
|
|
cycle_byte_count_next = op_count_next;
|
|
last_cycle = 1'b1;
|
|
|
|
start_offset_next = addr_next;
|
|
{ram_wrap_next, end_offset_next} = start_offset_next+cycle_byte_count_next-1;
|
|
end
|
|
end else begin
|
|
// last completion
|
|
op_count_next = byte_count_next;
|
|
final_cpl_next = 1'b1;
|
|
|
|
if (op_count_next > (AXIS_PCIE_DATA_WIDTH/8-12)-lower_addr_next[1:0]) begin
|
|
// more than one cycle
|
|
cycle_byte_count_next = (AXIS_PCIE_DATA_WIDTH/8-12)-lower_addr_next[1:0];
|
|
last_cycle = 1'b0;
|
|
|
|
start_offset_next = addr_next;
|
|
{ram_wrap_next, end_offset_next} = start_offset_next+cycle_byte_count_next-1;
|
|
end else begin
|
|
// one cycle
|
|
cycle_byte_count_next = op_count_next;
|
|
last_cycle = 1'b1;
|
|
|
|
start_offset_next = addr_next;
|
|
{ram_wrap_next, end_offset_next} = start_offset_next+cycle_byte_count_next-1;
|
|
end
|
|
end
|
|
|
|
ram_mask_0_next = {SEG_COUNT{1'b1}} << (start_offset_next >> $clog2(SEG_BE_WIDTH));
|
|
ram_mask_1_next = {SEG_COUNT{1'b1}} >> (SEG_COUNT-1-(end_offset_next >> $clog2(SEG_BE_WIDTH)));
|
|
|
|
if (!ram_wrap_next) begin
|
|
ram_mask_next = ram_mask_0_next & ram_mask_1_next;
|
|
ram_mask_0_next = ram_mask_0_next & ram_mask_1_next;
|
|
ram_mask_1_next = 0;
|
|
end else begin
|
|
ram_mask_next = ram_mask_0_next | ram_mask_1_next;
|
|
end
|
|
|
|
addr_delay_next = addr_next;
|
|
addr_next = addr_next + cycle_byte_count_next;
|
|
op_count_next = op_count_next - cycle_byte_count_next;
|
|
|
|
op_tag_next = pcie_tag_table_op_tag[pcie_tag_next];
|
|
|
|
if (pcie_tag_table_active_b[pcie_tag_next] == pcie_tag_table_active_a[pcie_tag_next]) begin
|
|
// tag not active, handle as unexpected completion (2.3.2), advisory non-fatal (6.2.3.2.4.5)
|
|
|
|
// drop TLP and report correctable error
|
|
status_error_cor_next = 1'b1;
|
|
if (s_axis_rc_tlast) begin
|
|
tlp_state_next = TLP_STATE_IDLE;
|
|
end else begin
|
|
s_axis_rc_tready_next = init_done_reg;
|
|
tlp_state_next = TLP_STATE_WAIT_END;
|
|
end
|
|
end else if (error_code_next == RC_ERROR_MISMATCH) begin
|
|
// format/status mismatch, handle as malformed TLP (2.3.2)
|
|
// ATTR or TC mismatch, handle as malformed TLP (2.3.2)
|
|
|
|
// drop TLP and report uncorrectable error
|
|
status_error_uncor_next = 1'b1;
|
|
if (s_axis_rc_tlast) begin
|
|
tlp_state_next = TLP_STATE_IDLE;
|
|
end else begin
|
|
s_axis_rc_tready_next = init_done_reg;
|
|
tlp_state_next = TLP_STATE_WAIT_END;
|
|
end
|
|
end else if (error_code_next == RC_ERROR_POISONED || error_code_next == RC_ERROR_BAD_STATUS ||
|
|
error_code_next == RC_ERROR_TIMEOUT || error_code_next == RC_ERROR_FLR) begin
|
|
// transfer-terminating error
|
|
|
|
if (error_code_next == RC_ERROR_POISONED) begin
|
|
// poisoned TLP, handle as advisory non-fatal (6.2.3.2.4.3)
|
|
// drop TLP and report correctable error
|
|
status_error_cor_next = 1'b1;
|
|
status_fifo_error_next = DMA_ERROR_PCIE_CPL_POISONED;
|
|
end else if (error_code_next == RC_ERROR_BAD_STATUS) begin
|
|
// bad status, handle as advisory non-fatal (6.2.3.2.4.1)
|
|
// drop TLP and report correctable error
|
|
status_error_cor_next = 1'b1;
|
|
if (cpl_status_next == CPL_STATUS_CA) begin
|
|
status_fifo_error_next = DMA_ERROR_PCIE_CPL_STATUS_CA;
|
|
end else begin
|
|
status_fifo_error_next = DMA_ERROR_PCIE_CPL_STATUS_UR;
|
|
end
|
|
end else if (error_code_next == RC_ERROR_TIMEOUT) begin
|
|
// timeout, handle as uncorrectable (6.2.3.2.4.4)
|
|
// drop TLP and report uncorrectable error
|
|
status_error_uncor_next = 1'b1;
|
|
status_fifo_error_next = DMA_ERROR_TIMEOUT;
|
|
end else if (error_code_next == RC_ERROR_FLR) begin
|
|
// FLR; not an actual completion so no error to report
|
|
// drop TLP
|
|
status_fifo_error_next = DMA_ERROR_PCIE_FLR;
|
|
end
|
|
|
|
finish_tag_next = 1'b1;
|
|
|
|
status_fifo_mask_next = 1'b0;
|
|
status_fifo_finish_next = 1'b1;
|
|
status_fifo_wr_en_next = 1'b1;
|
|
|
|
if (s_axis_rc_tlast) begin
|
|
tlp_state_next = TLP_STATE_IDLE;
|
|
end else begin
|
|
s_axis_rc_tready_next = init_done_reg;
|
|
tlp_state_next = TLP_STATE_WAIT_END;
|
|
end
|
|
end else begin
|
|
// no error
|
|
|
|
rc_tdata_int_next = s_axis_rc_tdata;
|
|
rc_tvalid_int_next = 1'b1;
|
|
|
|
status_fifo_mask_next = 1'b1;
|
|
status_fifo_finish_next = 1'b0;
|
|
status_fifo_error_next = DMA_ERROR_NONE;
|
|
status_fifo_wr_en_next = 1'b1;
|
|
|
|
if (zero_len_next) begin
|
|
rc_tvalid_int_next = 1'b0;
|
|
status_fifo_mask_next = 1'b0;
|
|
end
|
|
|
|
if (last_cycle) begin
|
|
if (final_cpl_next) begin
|
|
// last completion in current read request (PCIe tag)
|
|
|
|
// release tag
|
|
finish_tag_next = 1'b1;
|
|
status_fifo_finish_next = 1'b1;
|
|
end
|
|
tlp_state_next = TLP_STATE_IDLE;
|
|
end else begin
|
|
tlp_state_next = TLP_STATE_WRITE;
|
|
end
|
|
end
|
|
end else begin
|
|
tlp_state_next = TLP_STATE_IDLE;
|
|
end
|
|
end else begin
|
|
s_axis_rc_tready_next = init_done_reg;
|
|
|
|
if (s_axis_rc_tready && s_axis_rc_tvalid) begin
|
|
// header fields
|
|
lower_addr_next = s_axis_rc_tdata[11:0]; // lower address
|
|
error_code_next = s_axis_rc_tdata[15:12]; // error code
|
|
byte_count_next = s_axis_rc_tdata[28:16]; // byte count
|
|
//s_axis_rc_tdata[29]; // locked read
|
|
//s_axis_rc_tdata[30]; // request completed
|
|
op_dword_count_next = s_axis_rc_tdata[42:32]; // DWORD count
|
|
cpl_status_next = s_axis_rc_tdata[45:43]; // completion status
|
|
//s_axis_rc_tdata[46]; // poisoned completion
|
|
//s_axis_rc_tdata[63:48]; // requester ID
|
|
|
|
// tuser fields
|
|
//s_axis_rc_tuser[31:0]; // byte enables
|
|
//s_axis_rc_tuser[32]; // is_sof_0
|
|
//s_axis_rc_tuser[33]; // is_sof_1
|
|
//s_axis_rc_tuser[37:34]; // is_eof_0
|
|
//s_axis_rc_tuser[41:38]; // is_eof_1
|
|
//s_axis_rc_tuser[42]; // discontinue
|
|
//s_axis_rc_tuser[74:43]; // parity
|
|
|
|
if (byte_count_next > (op_dword_count_next << 2) - lower_addr_next[1:0]) begin
|
|
// more completions to follow
|
|
op_count_next = (op_dword_count_next << 2) - lower_addr_next[1:0];
|
|
final_cpl_next = 1'b0;
|
|
end else begin
|
|
// last completion
|
|
op_count_next = byte_count_next;
|
|
final_cpl_next = 1'b1;
|
|
end
|
|
|
|
if (s_axis_rc_tlast) begin
|
|
s_axis_rc_tready_next = init_done_reg;
|
|
tlp_state_next = TLP_STATE_IDLE;
|
|
end else begin
|
|
s_axis_rc_tready_next = init_done_reg && &ram_wr_cmd_ready_int && !status_fifo_half_full_reg;
|
|
tlp_state_next = TLP_STATE_HEADER;
|
|
end
|
|
end else begin
|
|
s_axis_rc_tready_next = init_done_reg;
|
|
tlp_state_next = TLP_STATE_IDLE;
|
|
end
|
|
end
|
|
end
|
|
TLP_STATE_HEADER: begin
|
|
// header state; process header (64 bit interface only)
|
|
s_axis_rc_tready_next = init_done_reg && &ram_wr_cmd_ready_int && !status_fifo_half_full_reg;
|
|
|
|
if (s_axis_rc_tready && s_axis_rc_tvalid) begin
|
|
pcie_tag_next = s_axis_rc_tdata[7:0]; // tag
|
|
//s_axis_rc_tdata[23:8]; // completer ID
|
|
//s_axis_rc_tdata[27:25]; // attr
|
|
//s_axis_rc_tdata[30:28]; // tc
|
|
|
|
ram_sel_next = pcie_tag_table_ram_sel[pcie_tag_next];
|
|
addr_next = pcie_tag_table_ram_addr[pcie_tag_next] - byte_count_reg;
|
|
zero_len_next = pcie_tag_table_zero_len[pcie_tag_next];
|
|
|
|
offset_next = addr_next[OFFSET_WIDTH-1:0] - (4+lower_addr_reg[1:0]);
|
|
|
|
if (op_count_next > 4-lower_addr_reg[1:0]) begin
|
|
// more than one cycle
|
|
cycle_byte_count_next = 4-lower_addr_reg[1:0];
|
|
last_cycle = 1'b0;
|
|
end else begin
|
|
// one cycle
|
|
cycle_byte_count_next = op_count_next;
|
|
last_cycle = 1'b1;
|
|
end
|
|
start_offset_next = addr_next;
|
|
{ram_wrap_next, end_offset_next} = start_offset_next+cycle_byte_count_next-1;
|
|
|
|
ram_mask_0_next = {SEG_COUNT{1'b1}} << (start_offset_next >> $clog2(SEG_BE_WIDTH));
|
|
ram_mask_1_next = {SEG_COUNT{1'b1}} >> (SEG_COUNT-1-(end_offset_next >> $clog2(SEG_BE_WIDTH)));
|
|
|
|
if (!ram_wrap_next) begin
|
|
ram_mask_next = ram_mask_0_next & ram_mask_1_next;
|
|
ram_mask_0_next = ram_mask_0_next & ram_mask_1_next;
|
|
ram_mask_1_next = 0;
|
|
end else begin
|
|
ram_mask_next = ram_mask_0_next | ram_mask_1_next;
|
|
end
|
|
|
|
addr_delay_next = addr_next;
|
|
addr_next = addr_next + cycle_byte_count_next;
|
|
op_count_next = op_count_next - cycle_byte_count_next;
|
|
|
|
op_tag_next = pcie_tag_table_op_tag[pcie_tag_next];
|
|
|
|
if (pcie_tag_table_active_b[pcie_tag_next] == pcie_tag_table_active_a[pcie_tag_next]) begin
|
|
// tag not active, handle as unexpected completion (2.3.2), advisory non-fatal (6.2.3.2.4.5)
|
|
|
|
// drop TLP and report correctable error
|
|
status_error_cor_next = 1'b1;
|
|
if (s_axis_rc_tlast) begin
|
|
tlp_state_next = TLP_STATE_IDLE;
|
|
end else begin
|
|
s_axis_rc_tready_next = init_done_reg;
|
|
tlp_state_next = TLP_STATE_WAIT_END;
|
|
end
|
|
end else if (error_code_next == RC_ERROR_MISMATCH) begin
|
|
// format/status mismatch, handle as malformed TLP (2.3.2)
|
|
// ATTR or TC mismatch, handle as malformed TLP (2.3.2)
|
|
|
|
// drop TLP and report uncorrectable error
|
|
status_error_uncor_next = 1'b1;
|
|
if (s_axis_rc_tlast) begin
|
|
tlp_state_next = TLP_STATE_IDLE;
|
|
end else begin
|
|
s_axis_rc_tready_next = init_done_reg;
|
|
tlp_state_next = TLP_STATE_WAIT_END;
|
|
end
|
|
end else if (error_code_next == RC_ERROR_POISONED || error_code_next == RC_ERROR_BAD_STATUS ||
|
|
error_code_next == RC_ERROR_TIMEOUT || error_code_next == RC_ERROR_FLR) begin
|
|
// transfer-terminating error
|
|
|
|
if (error_code_next == RC_ERROR_POISONED) begin
|
|
// poisoned TLP, handle as advisory non-fatal (6.2.3.2.4.3)
|
|
// drop TLP and report correctable error
|
|
status_error_cor_next = 1'b1;
|
|
status_fifo_error_next = DMA_ERROR_PCIE_CPL_POISONED;
|
|
end else if (error_code_next == RC_ERROR_BAD_STATUS) begin
|
|
// bad status, handle as advisory non-fatal (6.2.3.2.4.1)
|
|
// drop TLP and report correctable error
|
|
status_error_cor_next = 1'b1;
|
|
if (cpl_status_reg == CPL_STATUS_CA) begin
|
|
status_fifo_error_next = DMA_ERROR_PCIE_CPL_STATUS_CA;
|
|
end else begin
|
|
status_fifo_error_next = DMA_ERROR_PCIE_CPL_STATUS_UR;
|
|
end
|
|
end else if (error_code_next == RC_ERROR_TIMEOUT) begin
|
|
// timeout, handle as uncorrectable (6.2.3.2.4.4)
|
|
// drop TLP and report uncorrectable error
|
|
status_error_uncor_next = 1'b1;
|
|
status_fifo_error_next = DMA_ERROR_TIMEOUT;
|
|
end else if (error_code_next == RC_ERROR_FLR) begin
|
|
// FLR; not an actual completion so no error to report
|
|
// drop TLP
|
|
status_fifo_error_next = DMA_ERROR_PCIE_FLR;
|
|
end
|
|
|
|
finish_tag_next = 1'b1;
|
|
|
|
status_fifo_mask_next = 1'b0;
|
|
status_fifo_finish_next = 1'b1;
|
|
status_fifo_wr_en_next = 1'b1;
|
|
|
|
if (s_axis_rc_tlast) begin
|
|
tlp_state_next = TLP_STATE_IDLE;
|
|
end else begin
|
|
s_axis_rc_tready_next = init_done_reg;
|
|
tlp_state_next = TLP_STATE_WAIT_END;
|
|
end
|
|
end else begin
|
|
// no error
|
|
|
|
if (zero_len_next) begin
|
|
status_fifo_mask_next = 1'b0;
|
|
end else begin
|
|
rc_tdata_int_next = s_axis_rc_tdata;
|
|
rc_tvalid_int_next = 1'b1;
|
|
|
|
status_fifo_mask_next = 1'b1;
|
|
end
|
|
|
|
status_fifo_finish_next = 1'b0;
|
|
status_fifo_error_next = DMA_ERROR_NONE;
|
|
status_fifo_wr_en_next = 1'b1;
|
|
|
|
if (last_cycle) begin
|
|
if (final_cpl_next) begin
|
|
// last completion in current read request (PCIe tag)
|
|
|
|
// release tag
|
|
finish_tag_next = 1'b1;
|
|
status_fifo_finish_next = 1'b1;
|
|
end
|
|
tlp_state_next = TLP_STATE_IDLE;
|
|
end else begin
|
|
tlp_state_next = TLP_STATE_WRITE;
|
|
end
|
|
end
|
|
end else begin
|
|
tlp_state_next = TLP_STATE_HEADER;
|
|
end
|
|
end
|
|
TLP_STATE_WRITE: begin
|
|
// write state - generate write operations
|
|
s_axis_rc_tready_next = init_done_reg && &ram_wr_cmd_ready_int && !status_fifo_half_full_reg;
|
|
|
|
if (s_axis_rc_tready && s_axis_rc_tvalid) begin
|
|
rc_tdata_int_next = s_axis_rc_tdata;
|
|
rc_tvalid_int_next = 1'b1;
|
|
|
|
if (op_count_next > AXIS_PCIE_DATA_WIDTH/8) begin
|
|
// more cycles after this one
|
|
cycle_byte_count_next = AXIS_PCIE_DATA_WIDTH/8;
|
|
last_cycle = 1'b0;
|
|
end else begin
|
|
// last cycle
|
|
cycle_byte_count_next = op_count_next;
|
|
last_cycle = 1'b1;
|
|
end
|
|
start_offset_next = addr_next;
|
|
{ram_wrap_next, end_offset_next} = start_offset_next+cycle_byte_count_next-1;
|
|
|
|
ram_mask_0_next = {SEG_COUNT{1'b1}} << (start_offset_next >> $clog2(SEG_BE_WIDTH));
|
|
ram_mask_1_next = {SEG_COUNT{1'b1}} >> (SEG_COUNT-1-(end_offset_next >> $clog2(SEG_BE_WIDTH)));
|
|
|
|
if (!ram_wrap_next) begin
|
|
ram_mask_next = ram_mask_0_next & ram_mask_1_next;
|
|
ram_mask_0_next = ram_mask_0_next & ram_mask_1_next;
|
|
ram_mask_1_next = 0;
|
|
end else begin
|
|
ram_mask_next = ram_mask_0_next | ram_mask_1_next;
|
|
end
|
|
|
|
addr_delay_next = addr_reg;
|
|
addr_next = addr_reg + cycle_byte_count_next;
|
|
op_count_next = op_count_reg - cycle_byte_count_next;
|
|
|
|
status_fifo_mask_next = 1'b1;
|
|
status_fifo_finish_next = 1'b0;
|
|
status_fifo_error_next = DMA_ERROR_NONE;
|
|
status_fifo_wr_en_next = 1'b1;
|
|
|
|
if (last_cycle) begin
|
|
if (final_cpl_reg) begin
|
|
// last completion in current read request (PCIe tag)
|
|
|
|
// release tag
|
|
finish_tag_next = 1'b1;
|
|
status_fifo_finish_next = 1'b1;
|
|
end
|
|
|
|
if (AXIS_PCIE_DATA_WIDTH == 64) begin
|
|
s_axis_rc_tready_next = init_done_reg;
|
|
end
|
|
tlp_state_next = TLP_STATE_IDLE;
|
|
end else begin
|
|
tlp_state_next = TLP_STATE_WRITE;
|
|
end
|
|
end else begin
|
|
tlp_state_next = TLP_STATE_WRITE;
|
|
end
|
|
end
|
|
TLP_STATE_WAIT_END: begin
|
|
// wait end state, wait for end of TLP
|
|
s_axis_rc_tready_next = init_done_reg;
|
|
|
|
if (s_axis_rc_tready & s_axis_rc_tvalid) begin
|
|
if (s_axis_rc_tlast) begin
|
|
if (AXIS_PCIE_DATA_WIDTH > 64) begin
|
|
s_axis_rc_tready_next = init_done_reg && &ram_wr_cmd_ready_int && !status_fifo_half_full_reg;
|
|
end else begin
|
|
s_axis_rc_tready_next = init_done_reg;
|
|
end
|
|
tlp_state_next = TLP_STATE_IDLE;
|
|
end else begin
|
|
tlp_state_next = TLP_STATE_WAIT_END;
|
|
end
|
|
end else begin
|
|
tlp_state_next = TLP_STATE_WAIT_END;
|
|
end
|
|
end
|
|
endcase
|
|
|
|
pcie_tag_table_finish_ptr = pcie_tag_reg;
|
|
pcie_tag_table_finish_en = 1'b0;
|
|
|
|
pcie_tag_fifo_wr_tag = pcie_tag_reg;
|
|
pcie_tag_fifo_1_we = 1'b0;
|
|
pcie_tag_fifo_2_we = 1'b0;
|
|
|
|
if (init_pcie_tag_reg) begin
|
|
// initialize FIFO
|
|
pcie_tag_fifo_wr_tag = init_count_reg;
|
|
if (pcie_tag_fifo_wr_tag < PCIE_TAG_COUNT_1) begin
|
|
pcie_tag_fifo_1_we = 1'b1;
|
|
end else if (pcie_tag_fifo_wr_tag) begin
|
|
pcie_tag_fifo_2_we = 1'b1;
|
|
end
|
|
end else if (finish_tag_reg) begin
|
|
pcie_tag_table_finish_ptr = pcie_tag_reg;
|
|
pcie_tag_table_finish_en = 1'b1;
|
|
|
|
pcie_tag_fifo_wr_tag = pcie_tag_reg;
|
|
if (pcie_tag_fifo_wr_tag < PCIE_TAG_COUNT_1) begin
|
|
pcie_tag_fifo_1_we = 1'b1;
|
|
end else begin
|
|
pcie_tag_fifo_2_we = 1'b1;
|
|
end
|
|
end
|
|
|
|
status_fifo_wr_op_tag = op_tag_reg;
|
|
status_fifo_wr_mask = status_fifo_mask_reg ? ram_mask_reg : 0;
|
|
status_fifo_wr_finish = status_fifo_finish_reg;
|
|
status_fifo_wr_error = status_fifo_error_reg;
|
|
status_fifo_wr_en = status_fifo_wr_en_reg;
|
|
|
|
status_fifo_rd_valid_next = status_fifo_rd_valid_reg;
|
|
status_fifo_rd_en = 1'b0;
|
|
|
|
m_axis_read_desc_status_tag_next = op_table_tag[status_fifo_rd_op_tag_reg];
|
|
if (status_fifo_rd_error_reg != DMA_ERROR_NONE) begin
|
|
m_axis_read_desc_status_error_next = status_fifo_rd_error_reg;
|
|
end else if (op_table_error_a[status_fifo_rd_op_tag_reg] != op_table_error_b[status_fifo_rd_op_tag_reg]) begin
|
|
m_axis_read_desc_status_error_next = op_table_error_code[status_fifo_rd_op_tag_reg];
|
|
end else begin
|
|
m_axis_read_desc_status_error_next = DMA_ERROR_NONE;
|
|
end
|
|
m_axis_read_desc_status_valid_next = 1'b0;
|
|
|
|
op_table_update_status_ptr = status_fifo_rd_op_tag_reg;
|
|
if (status_fifo_rd_error_reg != DMA_ERROR_NONE) begin
|
|
op_table_update_status_error = status_fifo_rd_error_reg;
|
|
end else begin
|
|
op_table_update_status_error = DMA_ERROR_NONE;
|
|
end
|
|
op_table_update_status_en = 1'b0;
|
|
|
|
op_table_read_finish_ptr = status_fifo_rd_op_tag_reg;
|
|
op_table_read_finish_en = 1'b0;
|
|
|
|
op_tag_fifo_wr_tag = status_fifo_rd_op_tag_reg;
|
|
op_tag_fifo_we = 1'b0;
|
|
|
|
if (init_op_tag_reg) begin
|
|
// initialize FIFO
|
|
op_tag_fifo_wr_tag = init_count_reg;
|
|
op_tag_fifo_we = 1'b1;
|
|
end else if (status_fifo_rd_valid_reg && (status_fifo_rd_mask_reg & ~out_done) == 0) begin
|
|
// got write completion, pop and return status
|
|
status_fifo_rd_valid_next = 1'b0;
|
|
op_table_update_status_en = 1'b1;
|
|
|
|
out_done_ack = status_fifo_rd_mask_reg;
|
|
|
|
if (status_fifo_rd_finish_reg) begin
|
|
// mark done
|
|
op_table_read_finish_en = 1'b1;
|
|
|
|
if (op_table_read_commit[op_table_read_finish_ptr] && (op_table_read_count_start[op_table_read_finish_ptr] == op_table_read_count_finish[op_table_read_finish_ptr])) begin
|
|
op_tag_fifo_we = 1'b1;
|
|
m_axis_read_desc_status_valid_next = 1'b1;
|
|
end
|
|
end
|
|
end
|
|
|
|
if (!status_fifo_rd_valid_next && status_fifo_rd_ptr_reg != status_fifo_wr_ptr_reg) begin
|
|
// status FIFO not empty
|
|
status_fifo_rd_en = 1'b1;
|
|
status_fifo_rd_valid_next = 1'b1;
|
|
end
|
|
end
|
|
|
|
always @(posedge clk) begin
|
|
req_state_reg <= req_state_next;
|
|
tlp_state_reg <= tlp_state_next;
|
|
|
|
if (!init_done_reg) begin
|
|
{init_done_reg, init_count_reg} <= init_count_reg + 1;
|
|
init_pcie_tag_reg <= init_count_reg + 1 < 2**PCIE_TAG_WIDTH;
|
|
init_op_tag_reg <= init_count_reg + 1 < 2**OP_TAG_WIDTH;
|
|
end
|
|
|
|
status_error_cor_reg <= status_error_cor_next;
|
|
status_error_uncor_reg <= status_error_uncor_next;
|
|
|
|
req_pcie_addr_reg <= req_pcie_addr_next;
|
|
req_ram_sel_reg <= req_ram_sel_next;
|
|
req_ram_addr_reg <= req_ram_addr_next;
|
|
req_op_count_reg <= req_op_count_next;
|
|
req_tlp_count_reg <= req_tlp_count_next;
|
|
req_zero_len_reg <= req_zero_len_next;
|
|
req_op_tag_reg <= req_op_tag_next;
|
|
req_op_tag_valid_reg <= req_op_tag_valid_next;
|
|
req_pcie_tag_reg <= req_pcie_tag_next;
|
|
req_pcie_tag_valid_reg <= req_pcie_tag_valid_next;
|
|
|
|
lower_addr_reg <= lower_addr_next;
|
|
byte_count_reg <= byte_count_next;
|
|
error_code_reg <= error_code_next;
|
|
ram_sel_reg <= ram_sel_next;
|
|
addr_reg <= addr_next;
|
|
addr_delay_reg <= addr_delay_next;
|
|
op_count_reg <= op_count_next;
|
|
zero_len_reg <= zero_len_next;
|
|
ram_mask_reg <= ram_mask_next;
|
|
ram_mask_0_reg <= ram_mask_0_next;
|
|
ram_mask_1_reg <= ram_mask_1_next;
|
|
ram_wrap_reg <= ram_wrap_next;
|
|
cycle_byte_count_reg <= cycle_byte_count_next;
|
|
start_offset_reg <= start_offset_next;
|
|
end_offset_reg <= end_offset_next;
|
|
op_dword_count_reg <= op_dword_count_next;
|
|
cpl_status_reg <= cpl_status_next;
|
|
pcie_tag_reg <= pcie_tag_next;
|
|
op_tag_reg <= op_tag_next;
|
|
final_cpl_reg <= final_cpl_next;
|
|
finish_tag_reg <= finish_tag_next;
|
|
|
|
offset_reg <= offset_next;
|
|
|
|
rc_tdata_int_reg <= rc_tdata_int_next;
|
|
rc_tvalid_int_reg <= rc_tvalid_int_next;
|
|
|
|
s_axis_rc_tready_reg <= s_axis_rc_tready_next;
|
|
s_axis_read_desc_ready_reg <= s_axis_read_desc_ready_next;
|
|
|
|
m_axis_read_desc_status_tag_reg <= m_axis_read_desc_status_tag_next;
|
|
m_axis_read_desc_status_error_reg <= m_axis_read_desc_status_error_next;
|
|
m_axis_read_desc_status_valid_reg <= m_axis_read_desc_status_valid_next;
|
|
|
|
max_read_request_size_dw_reg <= 11'd32 << (max_read_request_size > 5 ? 5 : max_read_request_size);
|
|
|
|
have_credit_reg <= pcie_tx_fc_nph_av > 4;
|
|
|
|
if (status_fifo_wr_en) begin
|
|
status_fifo_op_tag[status_fifo_wr_ptr_reg[STATUS_FIFO_ADDR_WIDTH-1:0]] <= status_fifo_wr_op_tag;
|
|
status_fifo_mask[status_fifo_wr_ptr_reg[STATUS_FIFO_ADDR_WIDTH-1:0]] <= status_fifo_wr_mask;
|
|
status_fifo_finish[status_fifo_wr_ptr_reg[STATUS_FIFO_ADDR_WIDTH-1:0]] <= status_fifo_wr_finish;
|
|
status_fifo_error[status_fifo_wr_ptr_reg[STATUS_FIFO_ADDR_WIDTH-1:0]] <= status_fifo_wr_error;
|
|
status_fifo_wr_ptr_reg <= status_fifo_wr_ptr_reg + 1;
|
|
end
|
|
|
|
if (status_fifo_rd_en) begin
|
|
status_fifo_rd_op_tag_reg <= status_fifo_op_tag[status_fifo_rd_ptr_reg[STATUS_FIFO_ADDR_WIDTH-1:0]];
|
|
status_fifo_rd_mask_reg <= status_fifo_mask[status_fifo_rd_ptr_reg[STATUS_FIFO_ADDR_WIDTH-1:0]];
|
|
status_fifo_rd_finish_reg <= status_fifo_finish[status_fifo_rd_ptr_reg[STATUS_FIFO_ADDR_WIDTH-1:0]];
|
|
status_fifo_rd_error_reg <= status_fifo_error[status_fifo_rd_ptr_reg[STATUS_FIFO_ADDR_WIDTH-1:0]];
|
|
status_fifo_rd_ptr_reg <= status_fifo_rd_ptr_reg + 1;
|
|
end
|
|
|
|
status_fifo_mask_reg <= status_fifo_mask_next;
|
|
status_fifo_finish_reg <= status_fifo_finish_next;
|
|
status_fifo_error_reg <= status_fifo_error_next;
|
|
status_fifo_wr_en_reg <= status_fifo_wr_en_next;
|
|
|
|
status_fifo_rd_valid_reg <= status_fifo_rd_valid_next;
|
|
|
|
status_fifo_half_full_reg <= $unsigned(status_fifo_wr_ptr_reg - status_fifo_rd_ptr_reg) >= 2**(STATUS_FIFO_ADDR_WIDTH-1);
|
|
|
|
if (active_tx_count_reg < TX_LIMIT && inc_active_tx && !s_axis_rq_seq_num_valid_0 && !s_axis_rq_seq_num_valid_1) begin
|
|
// inc by 1
|
|
active_tx_count_reg <= active_tx_count_reg + 1;
|
|
active_tx_count_av_reg <= active_tx_count_reg < (TX_LIMIT-1);
|
|
end else if (active_tx_count_reg > 0 && ((inc_active_tx && s_axis_rq_seq_num_valid_0 && s_axis_rq_seq_num_valid_1) || (!inc_active_tx && (s_axis_rq_seq_num_valid_0 ^ s_axis_rq_seq_num_valid_1)))) begin
|
|
// dec by 1
|
|
active_tx_count_reg <= active_tx_count_reg - 1;
|
|
active_tx_count_av_reg <= 1'b1;
|
|
end else if (active_tx_count_reg > 1 && !inc_active_tx && s_axis_rq_seq_num_valid_0 && s_axis_rq_seq_num_valid_1) begin
|
|
// dec by 2
|
|
active_tx_count_reg <= active_tx_count_reg - 2;
|
|
active_tx_count_av_reg <= 1'b1;
|
|
end else begin
|
|
active_tx_count_av_reg <= active_tx_count_reg < TX_LIMIT;
|
|
end
|
|
|
|
pcie_tag_table_start_ptr_reg <= pcie_tag_table_start_ptr_next;
|
|
pcie_tag_table_start_ram_sel_reg <= pcie_tag_table_start_ram_sel_next;
|
|
pcie_tag_table_start_ram_addr_reg <= pcie_tag_table_start_ram_addr_next;
|
|
pcie_tag_table_start_op_tag_reg <= pcie_tag_table_start_op_tag_next;
|
|
pcie_tag_table_start_zero_len_reg <= pcie_tag_table_start_zero_len_next;
|
|
pcie_tag_table_start_en_reg <= pcie_tag_table_start_en_next;
|
|
|
|
if (init_pcie_tag_reg) begin
|
|
pcie_tag_table_active_a[init_count_reg] <= 1'b0;
|
|
end else if (pcie_tag_table_start_en_reg) begin
|
|
pcie_tag_table_ram_sel[pcie_tag_table_start_ptr_reg] <= pcie_tag_table_start_ram_sel_reg;
|
|
pcie_tag_table_ram_addr[pcie_tag_table_start_ptr_reg] <= pcie_tag_table_start_ram_addr_reg;
|
|
pcie_tag_table_op_tag[pcie_tag_table_start_ptr_reg] <= pcie_tag_table_start_op_tag_reg;
|
|
pcie_tag_table_zero_len[pcie_tag_table_start_ptr_reg] <= pcie_tag_table_start_zero_len_reg;
|
|
pcie_tag_table_active_a[pcie_tag_table_start_ptr_reg] <= !pcie_tag_table_active_b[pcie_tag_table_start_ptr_reg];
|
|
end
|
|
|
|
if (init_pcie_tag_reg) begin
|
|
pcie_tag_table_active_b[init_count_reg] <= 1'b0;
|
|
end else if (pcie_tag_table_finish_en) begin
|
|
pcie_tag_table_active_b[pcie_tag_table_finish_ptr] <= pcie_tag_table_active_a[pcie_tag_table_finish_ptr];
|
|
end
|
|
|
|
if (pcie_tag_fifo_1_we) begin
|
|
pcie_tag_fifo_1_mem[pcie_tag_fifo_1_wr_ptr_reg[PCIE_TAG_WIDTH_1-1:0]] <= pcie_tag_fifo_wr_tag;
|
|
pcie_tag_fifo_1_wr_ptr_reg <= pcie_tag_fifo_1_wr_ptr_reg + 1;
|
|
end
|
|
pcie_tag_fifo_1_rd_ptr_reg <= pcie_tag_fifo_1_rd_ptr_next;
|
|
if (pcie_tag_fifo_2_we) begin
|
|
pcie_tag_fifo_2_mem[pcie_tag_fifo_2_wr_ptr_reg[PCIE_TAG_WIDTH_2-1:0]] <= pcie_tag_fifo_wr_tag;
|
|
pcie_tag_fifo_2_wr_ptr_reg <= pcie_tag_fifo_2_wr_ptr_reg + 1;
|
|
end
|
|
pcie_tag_fifo_2_rd_ptr_reg <= pcie_tag_fifo_2_rd_ptr_next;
|
|
|
|
if (init_op_tag_reg) begin
|
|
op_table_read_init_a[init_count_reg] <= 1'b0;
|
|
op_table_error_a[init_count_reg] <= 1'b0;
|
|
end else if (op_table_start_en) begin
|
|
op_table_tag[op_table_start_ptr] <= op_table_start_tag;
|
|
op_table_read_init_a[op_table_start_ptr] <= !op_table_read_init_b[op_table_start_ptr];
|
|
op_table_error_a[op_table_start_ptr] <= op_table_error_b[op_table_start_ptr];
|
|
end
|
|
|
|
if (init_op_tag_reg) begin
|
|
op_table_read_init_b[init_count_reg] <= 1'b0;
|
|
op_table_read_count_start[init_count_reg] <= 0;
|
|
end else if (op_table_read_start_en) begin
|
|
op_table_read_init_b[op_table_read_start_ptr] <= op_table_read_init_a[op_table_read_start_ptr];
|
|
op_table_read_commit[op_table_read_start_ptr] <= op_table_read_start_commit;
|
|
if (op_table_read_init_b[op_table_read_start_ptr] != op_table_read_init_a[op_table_read_start_ptr]) begin
|
|
op_table_read_count_start[op_table_read_start_ptr] <= op_table_read_count_finish[op_table_read_start_ptr];
|
|
end else begin
|
|
op_table_read_count_start[op_table_read_start_ptr] <= op_table_read_count_start[op_table_read_start_ptr] + 1;
|
|
end
|
|
end
|
|
|
|
if (init_op_tag_reg) begin
|
|
op_table_error_b[init_count_reg] <= 1'b0;
|
|
end else if (op_table_update_status_en) begin
|
|
if (op_table_update_status_error != 0) begin
|
|
op_table_error_code[op_table_update_status_ptr] <= op_table_update_status_error;
|
|
op_table_error_b[op_table_update_status_ptr] <= !op_table_error_a[op_table_update_status_ptr];
|
|
end
|
|
end
|
|
|
|
if (init_op_tag_reg) begin
|
|
op_table_read_count_finish[init_count_reg] <= 0;
|
|
end else if (op_table_read_finish_en) begin
|
|
op_table_read_count_finish[op_table_read_finish_ptr] <= op_table_read_count_finish[op_table_read_finish_ptr] + 1;
|
|
end
|
|
|
|
if (op_tag_fifo_we) begin
|
|
op_tag_fifo_mem[op_tag_fifo_wr_ptr_reg[OP_TAG_WIDTH-1:0]] <= op_tag_fifo_wr_tag;
|
|
op_tag_fifo_wr_ptr_reg <= op_tag_fifo_wr_ptr_reg + 1;
|
|
end
|
|
op_tag_fifo_rd_ptr_reg <= op_tag_fifo_rd_ptr_next;
|
|
|
|
if (rst) begin
|
|
req_state_reg <= REQ_STATE_IDLE;
|
|
tlp_state_reg <= TLP_STATE_IDLE;
|
|
|
|
init_count_reg <= 0;
|
|
init_done_reg <= 1'b0;
|
|
init_pcie_tag_reg <= 1'b1;
|
|
init_op_tag_reg <= 1'b1;
|
|
|
|
req_op_tag_valid_reg <= 1'b0;
|
|
req_pcie_tag_valid_reg <= 1'b0;
|
|
|
|
finish_tag_reg <= 1'b0;
|
|
|
|
rc_tvalid_int_reg <= 1'b0;
|
|
|
|
s_axis_rc_tready_reg <= 1'b0;
|
|
|
|
s_axis_read_desc_ready_reg <= 1'b0;
|
|
m_axis_read_desc_status_valid_reg <= 1'b0;
|
|
|
|
status_fifo_wr_ptr_reg <= 0;
|
|
status_fifo_rd_ptr_reg <= 0;
|
|
status_fifo_wr_en_reg <= 1'b0;
|
|
status_fifo_rd_valid_reg <= 1'b0;
|
|
|
|
active_tx_count_reg <= {RQ_SEQ_NUM_WIDTH{1'b0}};
|
|
active_tx_count_av_reg <= 1'b1;
|
|
|
|
pcie_tag_table_start_en_reg <= 1'b0;
|
|
|
|
pcie_tag_fifo_1_wr_ptr_reg <= 0;
|
|
pcie_tag_fifo_1_rd_ptr_reg <= 0;
|
|
pcie_tag_fifo_2_wr_ptr_reg <= 0;
|
|
pcie_tag_fifo_2_rd_ptr_reg <= 0;
|
|
|
|
op_tag_fifo_wr_ptr_reg <= 0;
|
|
op_tag_fifo_rd_ptr_reg <= 0;
|
|
|
|
status_error_cor_reg <= 1'b0;
|
|
status_error_uncor_reg <= 1'b0;
|
|
end
|
|
end
|
|
|
|
// output datapath logic (PCIe TLP)
|
|
reg [AXIS_PCIE_DATA_WIDTH-1:0] m_axis_rq_tdata_reg = {AXIS_PCIE_DATA_WIDTH{1'b0}};
|
|
reg [AXIS_PCIE_KEEP_WIDTH-1:0] m_axis_rq_tkeep_reg = {AXIS_PCIE_KEEP_WIDTH{1'b0}};
|
|
reg m_axis_rq_tvalid_reg = 1'b0, m_axis_rq_tvalid_next;
|
|
reg m_axis_rq_tlast_reg = 1'b0;
|
|
reg [AXIS_PCIE_RQ_USER_WIDTH-1:0] m_axis_rq_tuser_reg = {AXIS_PCIE_RQ_USER_WIDTH{1'b0}};
|
|
|
|
reg [AXIS_PCIE_DATA_WIDTH-1:0] temp_m_axis_rq_tdata_reg = {AXIS_PCIE_DATA_WIDTH{1'b0}};
|
|
reg [AXIS_PCIE_KEEP_WIDTH-1:0] temp_m_axis_rq_tkeep_reg = {AXIS_PCIE_KEEP_WIDTH{1'b0}};
|
|
reg temp_m_axis_rq_tvalid_reg = 1'b0, temp_m_axis_rq_tvalid_next;
|
|
reg temp_m_axis_rq_tlast_reg = 1'b0;
|
|
reg [AXIS_PCIE_RQ_USER_WIDTH-1:0] temp_m_axis_rq_tuser_reg = {AXIS_PCIE_RQ_USER_WIDTH{1'b0}};
|
|
|
|
// datapath control
|
|
reg store_axis_rq_int_to_output;
|
|
reg store_axis_rq_int_to_temp;
|
|
reg store_axis_rq_temp_to_output;
|
|
|
|
assign m_axis_rq_tdata = m_axis_rq_tdata_reg;
|
|
assign m_axis_rq_tkeep = m_axis_rq_tkeep_reg;
|
|
assign m_axis_rq_tvalid = m_axis_rq_tvalid_reg;
|
|
assign m_axis_rq_tlast = m_axis_rq_tlast_reg;
|
|
assign m_axis_rq_tuser = m_axis_rq_tuser_reg;
|
|
|
|
// enable ready input next cycle if output is ready or the temp reg will not be filled on the next cycle (output reg empty or no input)
|
|
assign m_axis_rq_tready_int_early = m_axis_rq_tready || (!temp_m_axis_rq_tvalid_reg && (!m_axis_rq_tvalid_reg || !m_axis_rq_tvalid_int));
|
|
|
|
always @* begin
|
|
// transfer sink ready state to source
|
|
m_axis_rq_tvalid_next = m_axis_rq_tvalid_reg;
|
|
temp_m_axis_rq_tvalid_next = temp_m_axis_rq_tvalid_reg;
|
|
|
|
store_axis_rq_int_to_output = 1'b0;
|
|
store_axis_rq_int_to_temp = 1'b0;
|
|
store_axis_rq_temp_to_output = 1'b0;
|
|
|
|
if (m_axis_rq_tready_int_reg) begin
|
|
// input is ready
|
|
if (m_axis_rq_tready || !m_axis_rq_tvalid_reg) begin
|
|
// output is ready or currently not valid, transfer data to output
|
|
m_axis_rq_tvalid_next = m_axis_rq_tvalid_int;
|
|
store_axis_rq_int_to_output = 1'b1;
|
|
end else begin
|
|
// output is not ready, store input in temp
|
|
temp_m_axis_rq_tvalid_next = m_axis_rq_tvalid_int;
|
|
store_axis_rq_int_to_temp = 1'b1;
|
|
end
|
|
end else if (m_axis_rq_tready) begin
|
|
// input is not ready, but output is ready
|
|
m_axis_rq_tvalid_next = temp_m_axis_rq_tvalid_reg;
|
|
temp_m_axis_rq_tvalid_next = 1'b0;
|
|
store_axis_rq_temp_to_output = 1'b1;
|
|
end
|
|
end
|
|
|
|
always @(posedge clk) begin
|
|
if (rst) begin
|
|
m_axis_rq_tvalid_reg <= 1'b0;
|
|
m_axis_rq_tready_int_reg <= 1'b0;
|
|
temp_m_axis_rq_tvalid_reg <= 1'b0;
|
|
end else begin
|
|
m_axis_rq_tvalid_reg <= m_axis_rq_tvalid_next;
|
|
m_axis_rq_tready_int_reg <= m_axis_rq_tready_int_early;
|
|
temp_m_axis_rq_tvalid_reg <= temp_m_axis_rq_tvalid_next;
|
|
end
|
|
|
|
// datapath
|
|
if (store_axis_rq_int_to_output) begin
|
|
m_axis_rq_tdata_reg <= m_axis_rq_tdata_int;
|
|
m_axis_rq_tkeep_reg <= m_axis_rq_tkeep_int;
|
|
m_axis_rq_tlast_reg <= m_axis_rq_tlast_int;
|
|
m_axis_rq_tuser_reg <= m_axis_rq_tuser_int;
|
|
end else if (store_axis_rq_temp_to_output) begin
|
|
m_axis_rq_tdata_reg <= temp_m_axis_rq_tdata_reg;
|
|
m_axis_rq_tkeep_reg <= temp_m_axis_rq_tkeep_reg;
|
|
m_axis_rq_tlast_reg <= temp_m_axis_rq_tlast_reg;
|
|
m_axis_rq_tuser_reg <= temp_m_axis_rq_tuser_reg;
|
|
end
|
|
|
|
if (store_axis_rq_int_to_temp) begin
|
|
temp_m_axis_rq_tdata_reg <= m_axis_rq_tdata_int;
|
|
temp_m_axis_rq_tkeep_reg <= m_axis_rq_tkeep_int;
|
|
temp_m_axis_rq_tlast_reg <= m_axis_rq_tlast_int;
|
|
temp_m_axis_rq_tuser_reg <= m_axis_rq_tuser_int;
|
|
end
|
|
end
|
|
|
|
// output datapath logic (write data)
|
|
generate
|
|
|
|
genvar n;
|
|
|
|
for (n = 0; n < SEG_COUNT; n = n + 1) begin
|
|
|
|
reg [RAM_SEL_WIDTH-1:0] ram_wr_cmd_sel_reg = {RAM_SEL_WIDTH{1'b0}};
|
|
reg [SEG_BE_WIDTH-1:0] ram_wr_cmd_be_reg = {SEG_BE_WIDTH{1'b0}};
|
|
reg [SEG_ADDR_WIDTH-1:0] ram_wr_cmd_addr_reg = {SEG_ADDR_WIDTH{1'b0}};
|
|
reg [SEG_DATA_WIDTH-1:0] ram_wr_cmd_data_reg = {SEG_DATA_WIDTH{1'b0}};
|
|
reg ram_wr_cmd_valid_reg = 1'b0;
|
|
|
|
reg [OUTPUT_FIFO_ADDR_WIDTH-1:0] out_fifo_wr_ptr_reg = 0;
|
|
reg [OUTPUT_FIFO_ADDR_WIDTH-1:0] out_fifo_rd_ptr_reg = 0;
|
|
reg out_fifo_half_full_reg = 1'b0;
|
|
|
|
wire out_fifo_full = out_fifo_wr_ptr_reg == (out_fifo_rd_ptr_reg ^ {1'b1, {OUTPUT_FIFO_ADDR_WIDTH{1'b0}}});
|
|
wire out_fifo_empty = out_fifo_wr_ptr_reg == out_fifo_rd_ptr_reg;
|
|
|
|
(* ram_style = "distributed" *)
|
|
reg [RAM_SEL_WIDTH-1:0] out_fifo_wr_cmd_sel[2**OUTPUT_FIFO_ADDR_WIDTH-1:0];
|
|
(* ram_style = "distributed" *)
|
|
reg [SEG_BE_WIDTH-1:0] out_fifo_wr_cmd_be[2**OUTPUT_FIFO_ADDR_WIDTH-1:0];
|
|
(* ram_style = "distributed" *)
|
|
reg [SEG_ADDR_WIDTH-1:0] out_fifo_wr_cmd_addr[2**OUTPUT_FIFO_ADDR_WIDTH-1:0];
|
|
(* ram_style = "distributed" *)
|
|
reg [SEG_DATA_WIDTH-1:0] out_fifo_wr_cmd_data[2**OUTPUT_FIFO_ADDR_WIDTH-1:0];
|
|
|
|
reg [OUTPUT_FIFO_ADDR_WIDTH+1-1:0] done_count_reg = 0;
|
|
reg done_reg = 1'b0;
|
|
|
|
assign ram_wr_cmd_ready_int[n +: 1] = !out_fifo_half_full_reg;
|
|
|
|
assign ram_wr_cmd_sel[n*RAM_SEL_WIDTH +: RAM_SEL_WIDTH] = ram_wr_cmd_sel_reg;
|
|
assign ram_wr_cmd_be[n*SEG_BE_WIDTH +: SEG_BE_WIDTH] = ram_wr_cmd_be_reg;
|
|
assign ram_wr_cmd_addr[n*SEG_ADDR_WIDTH +: SEG_ADDR_WIDTH] = ram_wr_cmd_addr_reg;
|
|
assign ram_wr_cmd_data[n*SEG_DATA_WIDTH +: SEG_DATA_WIDTH] = ram_wr_cmd_data_reg;
|
|
assign ram_wr_cmd_valid[n +: 1] = ram_wr_cmd_valid_reg;
|
|
|
|
assign out_done[n] = done_reg;
|
|
|
|
always @(posedge clk) begin
|
|
ram_wr_cmd_valid_reg <= ram_wr_cmd_valid_reg && !ram_wr_cmd_ready[n +: 1];
|
|
|
|
out_fifo_half_full_reg <= $unsigned(out_fifo_wr_ptr_reg - out_fifo_rd_ptr_reg) >= 2**(OUTPUT_FIFO_ADDR_WIDTH-1);
|
|
|
|
if (!out_fifo_full && ram_wr_cmd_valid_int[n +: 1]) begin
|
|
out_fifo_wr_cmd_sel[out_fifo_wr_ptr_reg[OUTPUT_FIFO_ADDR_WIDTH-1:0]] <= ram_wr_cmd_sel_int[n*RAM_SEL_WIDTH +: RAM_SEL_WIDTH];
|
|
out_fifo_wr_cmd_be[out_fifo_wr_ptr_reg[OUTPUT_FIFO_ADDR_WIDTH-1:0]] <= ram_wr_cmd_be_int[n*SEG_BE_WIDTH +: SEG_BE_WIDTH];
|
|
out_fifo_wr_cmd_addr[out_fifo_wr_ptr_reg[OUTPUT_FIFO_ADDR_WIDTH-1:0]] <= ram_wr_cmd_addr_int[n*SEG_ADDR_WIDTH +: SEG_ADDR_WIDTH];
|
|
out_fifo_wr_cmd_data[out_fifo_wr_ptr_reg[OUTPUT_FIFO_ADDR_WIDTH-1:0]] <= ram_wr_cmd_data_int[n*SEG_DATA_WIDTH +: SEG_DATA_WIDTH];
|
|
out_fifo_wr_ptr_reg <= out_fifo_wr_ptr_reg + 1;
|
|
end
|
|
|
|
if (!out_fifo_empty && (!ram_wr_cmd_valid_reg || ram_wr_cmd_ready[n +: 1])) begin
|
|
ram_wr_cmd_sel_reg <= out_fifo_wr_cmd_sel[out_fifo_rd_ptr_reg[OUTPUT_FIFO_ADDR_WIDTH-1:0]];
|
|
ram_wr_cmd_be_reg <= out_fifo_wr_cmd_be[out_fifo_rd_ptr_reg[OUTPUT_FIFO_ADDR_WIDTH-1:0]];
|
|
ram_wr_cmd_addr_reg <= out_fifo_wr_cmd_addr[out_fifo_rd_ptr_reg[OUTPUT_FIFO_ADDR_WIDTH-1:0]];
|
|
ram_wr_cmd_data_reg <= out_fifo_wr_cmd_data[out_fifo_rd_ptr_reg[OUTPUT_FIFO_ADDR_WIDTH-1:0]];
|
|
ram_wr_cmd_valid_reg <= 1'b1;
|
|
out_fifo_rd_ptr_reg <= out_fifo_rd_ptr_reg + 1;
|
|
end
|
|
|
|
if (done_count_reg < 2**OUTPUT_FIFO_ADDR_WIDTH && ram_wr_done[n] && !out_done_ack[n]) begin
|
|
done_count_reg <= done_count_reg + 1;
|
|
done_reg <= 1;
|
|
end else if (done_count_reg > 0 && !ram_wr_done[n] && out_done_ack[n]) begin
|
|
done_count_reg <= done_count_reg - 1;
|
|
done_reg <= done_count_reg > 1;
|
|
end
|
|
|
|
if (rst) begin
|
|
out_fifo_wr_ptr_reg <= 0;
|
|
out_fifo_rd_ptr_reg <= 0;
|
|
ram_wr_cmd_valid_reg <= 1'b0;
|
|
done_count_reg <= 0;
|
|
done_reg <= 1'b0;
|
|
end
|
|
end
|
|
|
|
end
|
|
|
|
endgenerate
|
|
|
|
endmodule
|
|
|
|
`resetall
|