mirror of
https://github.com/corundum/corundum.git
synced 2025-01-16 08:12:53 +08:00
424 lines
12 KiB
C
424 lines
12 KiB
C
/*
|
|
|
|
Copyright 2019, The Regents of the University of California.
|
|
All rights reserved.
|
|
|
|
Redistribution and use in source and binary forms, with or without
|
|
modification, are permitted provided that the following conditions are met:
|
|
|
|
1. Redistributions of source code must retain the above copyright notice,
|
|
this list of conditions and the following disclaimer.
|
|
|
|
2. Redistributions in binary form must reproduce the above copyright notice,
|
|
this list of conditions and the following disclaimer in the documentation
|
|
and/or other materials provided with the distribution.
|
|
|
|
THIS SOFTWARE IS PROVIDED BY THE REGENTS OF THE UNIVERSITY OF CALIFORNIA ''AS
|
|
IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
|
|
DISCLAIMED. IN NO EVENT SHALL THE REGENTS OF THE UNIVERSITY OF CALIFORNIA OR
|
|
CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
|
EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT
|
|
OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING
|
|
IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY
|
|
OF SUCH DAMAGE.
|
|
|
|
The views and conclusions contained in the software and documentation are those
|
|
of the authors and should not be interpreted as representing official policies,
|
|
either expressed or implied, of The Regents of the University of California.
|
|
|
|
*/
|
|
|
|
#include "mqnic.h"
|
|
|
|
int mqnic_create_rx_ring(struct mqnic_priv *priv, struct mqnic_ring **ring_ptr, int size, int stride, int index, u8 __iomem *hw_addr)
|
|
{
|
|
struct device *dev = priv->dev;
|
|
struct mqnic_ring *ring;
|
|
int ret;
|
|
|
|
ring = kzalloc(sizeof(*ring), GFP_KERNEL);
|
|
if (!ring)
|
|
{
|
|
dev_err(dev, "Failed to allocate RX ring");
|
|
return -ENOMEM;
|
|
}
|
|
|
|
ring->size = roundup_pow_of_two(size);
|
|
ring->size_mask = ring->size-1;
|
|
ring->stride = roundup_pow_of_two(stride);
|
|
|
|
ring->rx_info = kvzalloc(sizeof(*ring->rx_info)*ring->size, GFP_KERNEL);
|
|
if (!ring->rx_info)
|
|
{
|
|
dev_err(dev, "Failed to allocate rx_info");
|
|
ret = -ENOMEM;
|
|
goto fail_ring;
|
|
}
|
|
|
|
ring->buf_size = ring->size*ring->stride;
|
|
ring->buf = dma_alloc_coherent(dev, ring->buf_size, &ring->buf_dma_addr, GFP_KERNEL);
|
|
if (!ring->buf)
|
|
{
|
|
dev_err(dev, "Failed to allocate RX ring DMA buffer");
|
|
ret = -ENOMEM;
|
|
goto fail_info;
|
|
}
|
|
|
|
ring->hw_addr = hw_addr;
|
|
ring->hw_ptr_mask = 0xffff;
|
|
ring->hw_head_ptr = hw_addr+MQNIC_QUEUE_HEAD_PTR_REG;
|
|
ring->hw_tail_ptr = hw_addr+MQNIC_QUEUE_TAIL_PTR_REG;
|
|
|
|
ring->head_ptr = 0;
|
|
ring->tail_ptr = 0;
|
|
ring->clean_tail_ptr = 0;
|
|
|
|
// deactivate queue
|
|
iowrite32(0, ring->hw_addr+MQNIC_QUEUE_ACTIVE_LOG_SIZE_REG);
|
|
// set base address
|
|
iowrite32(ring->buf_dma_addr, ring->hw_addr+MQNIC_QUEUE_BASE_ADDR_REG+0);
|
|
iowrite32(ring->buf_dma_addr >> 32, ring->hw_addr+MQNIC_QUEUE_BASE_ADDR_REG+4);
|
|
// set completion queue index
|
|
iowrite32(0, ring->hw_addr+MQNIC_QUEUE_CPL_QUEUE_INDEX_REG);
|
|
// set pointers
|
|
iowrite32(ring->head_ptr & ring->hw_ptr_mask, ring->hw_addr+MQNIC_QUEUE_HEAD_PTR_REG);
|
|
iowrite32(ring->tail_ptr & ring->hw_ptr_mask, ring->hw_addr+MQNIC_QUEUE_TAIL_PTR_REG);
|
|
// set size
|
|
iowrite32(ilog2(ring->size), ring->hw_addr+MQNIC_QUEUE_ACTIVE_LOG_SIZE_REG);
|
|
|
|
*ring_ptr = ring;
|
|
return 0;
|
|
|
|
fail_info:
|
|
kvfree(ring->rx_info);
|
|
ring->rx_info = NULL;
|
|
fail_ring:
|
|
kfree(ring);
|
|
*ring_ptr = NULL;
|
|
return ret;
|
|
}
|
|
|
|
void mqnic_destroy_rx_ring(struct mqnic_priv *priv, struct mqnic_ring **ring_ptr)
|
|
{
|
|
struct device *dev = priv->dev;
|
|
struct mqnic_ring *ring = *ring_ptr;
|
|
*ring_ptr = NULL;
|
|
|
|
mqnic_deactivate_rx_ring(priv, ring);
|
|
|
|
mqnic_free_rx_buf(priv, ring);
|
|
|
|
dma_free_coherent(dev, ring->buf_size, ring->buf, ring->buf_dma_addr);
|
|
kvfree(ring->rx_info);
|
|
ring->rx_info = NULL;
|
|
kfree(ring);
|
|
}
|
|
|
|
int mqnic_activate_rx_ring(struct mqnic_priv *priv, struct mqnic_ring *ring, int cpl_index)
|
|
{
|
|
// deactivate queue
|
|
iowrite32(0, ring->hw_addr+MQNIC_QUEUE_ACTIVE_LOG_SIZE_REG);
|
|
// set base address
|
|
iowrite32(ring->buf_dma_addr, ring->hw_addr+MQNIC_QUEUE_BASE_ADDR_REG+0);
|
|
iowrite32(ring->buf_dma_addr >> 32, ring->hw_addr+MQNIC_QUEUE_BASE_ADDR_REG+4);
|
|
// set completion queue index
|
|
iowrite32(cpl_index, ring->hw_addr+MQNIC_QUEUE_CPL_QUEUE_INDEX_REG);
|
|
// set pointers
|
|
iowrite32(ring->head_ptr & ring->hw_ptr_mask, ring->hw_addr+MQNIC_QUEUE_HEAD_PTR_REG);
|
|
iowrite32(ring->tail_ptr & ring->hw_ptr_mask, ring->hw_addr+MQNIC_QUEUE_TAIL_PTR_REG);
|
|
// set size and activate queue
|
|
iowrite32(ilog2(ring->size) | MQNIC_QUEUE_ACTIVE_MASK, ring->hw_addr+MQNIC_QUEUE_ACTIVE_LOG_SIZE_REG);
|
|
|
|
mqnic_refill_rx_buffers(priv, ring);
|
|
|
|
return 0;
|
|
}
|
|
|
|
void mqnic_deactivate_rx_ring(struct mqnic_priv *priv, struct mqnic_ring *ring)
|
|
{
|
|
// deactivate queue
|
|
iowrite32(ilog2(ring->size), ring->hw_addr+MQNIC_QUEUE_ACTIVE_LOG_SIZE_REG);
|
|
}
|
|
|
|
bool mqnic_is_rx_ring_empty(const struct mqnic_ring *ring)
|
|
{
|
|
return ring->head_ptr == ring->clean_tail_ptr;
|
|
}
|
|
|
|
bool mqnic_is_rx_ring_full(const struct mqnic_ring *ring)
|
|
{
|
|
return ring->head_ptr - ring->clean_tail_ptr >= ring->size;
|
|
}
|
|
|
|
void mqnic_rx_read_tail_ptr(struct mqnic_ring *ring)
|
|
{
|
|
ring->tail_ptr += (ioread32(ring->hw_tail_ptr) - ring->tail_ptr) & ring->hw_ptr_mask;
|
|
}
|
|
|
|
void mqnic_rx_write_head_ptr(struct mqnic_ring *ring)
|
|
{
|
|
iowrite32(ring->head_ptr & ring->hw_ptr_mask, ring->hw_head_ptr);
|
|
}
|
|
|
|
void mqnic_free_rx_desc(struct mqnic_priv *priv, struct mqnic_ring *ring, int index)
|
|
{
|
|
struct mqnic_rx_info *rx_info = &ring->rx_info[index];
|
|
struct page *page = rx_info->page;
|
|
|
|
dma_unmap_page(priv->dev, dma_unmap_addr(rx_info, dma_addr), dma_unmap_len(rx_info, len), PCI_DMA_FROMDEVICE);
|
|
rx_info->dma_addr = 0;
|
|
__free_pages(page, rx_info->page_order);
|
|
rx_info->page = NULL;
|
|
}
|
|
|
|
int mqnic_free_rx_buf(struct mqnic_priv *priv, struct mqnic_ring *ring)
|
|
{
|
|
u32 index;
|
|
int cnt = 0;
|
|
|
|
while (!mqnic_is_rx_ring_empty(ring))
|
|
{
|
|
index = ring->clean_tail_ptr & ring->size_mask;
|
|
mqnic_free_rx_desc(priv, ring, index);
|
|
ring->clean_tail_ptr++;
|
|
cnt++;
|
|
}
|
|
|
|
ring->head_ptr = 0;
|
|
ring->tail_ptr = 0;
|
|
ring->clean_tail_ptr = 0;
|
|
|
|
return cnt;
|
|
}
|
|
|
|
int mqnic_prepare_rx_desc(struct mqnic_priv *priv, struct mqnic_ring *ring, int index)
|
|
{
|
|
struct mqnic_rx_info *rx_info = &ring->rx_info[index];
|
|
struct mqnic_desc *rx_desc = (struct mqnic_desc *)(ring->buf + index*ring->stride);
|
|
struct page *page = rx_info->page;
|
|
u32 page_order = ring->page_order;
|
|
u32 len = PAGE_SIZE << page_order;
|
|
dma_addr_t dma_addr;
|
|
|
|
if (unlikely(page))
|
|
{
|
|
dev_err(&priv->mdev->pdev->dev, "mqnic_prepare_rx_desc skb not yet processed on port %d", priv->port);
|
|
return -1;
|
|
}
|
|
|
|
page = dev_alloc_pages(page_order);
|
|
if (unlikely(!page))
|
|
{
|
|
dev_err(&priv->mdev->pdev->dev, "mqnic_prepare_rx_desc failed to allocate memory on port %d", priv->port);
|
|
return -1;
|
|
}
|
|
|
|
// map page
|
|
dma_addr = dma_map_page(priv->dev, page, 0, len, PCI_DMA_FROMDEVICE);
|
|
|
|
if (unlikely(dma_mapping_error(priv->dev, dma_addr)))
|
|
{
|
|
dev_err(&priv->mdev->pdev->dev, "mqnic_prepare_rx_desc DMA mapping failed on port %d", priv->port);
|
|
__free_pages(page, page_order);
|
|
return -1;
|
|
}
|
|
|
|
// write descriptor
|
|
rx_desc->len = len;
|
|
rx_desc->addr = dma_addr;
|
|
|
|
// update rx_info
|
|
rx_info->page = page;
|
|
rx_info->page_order = page_order;
|
|
rx_info->page_offset = 0;
|
|
rx_info->dma_addr = dma_addr;
|
|
rx_info->len = len;
|
|
|
|
return 0;
|
|
}
|
|
|
|
void mqnic_refill_rx_buffers(struct mqnic_priv *priv, struct mqnic_ring *ring)
|
|
{
|
|
u32 missing = ring->size - (ring->head_ptr - ring->clean_tail_ptr);
|
|
|
|
if (missing < 8)
|
|
return;
|
|
|
|
for ( ; missing-- > 0; )
|
|
{
|
|
if (mqnic_prepare_rx_desc(priv, ring, ring->head_ptr & ring->size_mask))
|
|
break;
|
|
ring->head_ptr++;
|
|
}
|
|
|
|
// enqueue on NIC
|
|
dma_wmb();
|
|
mqnic_rx_write_head_ptr(ring);
|
|
}
|
|
|
|
int mqnic_process_rx_cq(struct net_device *ndev, struct mqnic_cq_ring *cq_ring, int napi_budget)
|
|
{
|
|
struct mqnic_priv *priv = netdev_priv(ndev);
|
|
struct mqnic_ring *ring = priv->rx_ring[cq_ring->ring_index];
|
|
struct mqnic_rx_info *rx_info;
|
|
struct mqnic_cpl *cpl;
|
|
struct sk_buff *skb;
|
|
struct page *page;
|
|
u32 cq_index;
|
|
u32 cq_tail_ptr;
|
|
u32 ring_index;
|
|
u32 ring_clean_tail_ptr;
|
|
int done = 0;
|
|
int budget = napi_budget;
|
|
u32 len;
|
|
|
|
if (unlikely(!priv->port_up))
|
|
{
|
|
return done;
|
|
}
|
|
|
|
// process completion queue
|
|
// read head pointer from NIC
|
|
mqnic_cq_read_head_ptr(cq_ring);
|
|
|
|
cq_tail_ptr = cq_ring->tail_ptr;
|
|
cq_index = cq_tail_ptr & cq_ring->size_mask;
|
|
|
|
mb(); // is a barrier here necessary? If so, what kind?
|
|
|
|
while (cq_ring->head_ptr != cq_tail_ptr && done < budget)
|
|
{
|
|
cpl = (struct mqnic_cpl *)(cq_ring->buf + cq_index*cq_ring->stride);
|
|
ring_index = cpl->index & ring->size_mask;
|
|
rx_info = &ring->rx_info[ring_index];
|
|
page = rx_info->page;
|
|
|
|
if (unlikely(!page))
|
|
{
|
|
dev_err(&priv->mdev->pdev->dev, "mqnic_process_rx_cq ring %d null page at index %d", cq_ring->ring_index, ring_index);
|
|
print_hex_dump(KERN_ERR, "", DUMP_PREFIX_NONE, 16, 1, cpl, MQNIC_CPL_SIZE, true);
|
|
break;
|
|
}
|
|
|
|
skb = napi_get_frags(&cq_ring->napi);
|
|
if (unlikely(!skb))
|
|
{
|
|
dev_err(&priv->mdev->pdev->dev, "mqnic_process_rx_cq ring %d failed to allocate skb", cq_ring->ring_index);
|
|
break;
|
|
}
|
|
|
|
// RX hardware timestamp
|
|
if (priv->if_features & MQNIC_IF_FEATURE_PTP_TS)
|
|
{
|
|
skb_hwtstamps(skb)->hwtstamp = mqnic_read_cpl_ts(priv->mdev, ring, cpl);
|
|
}
|
|
|
|
skb_record_rx_queue(skb, cq_ring->ring_index);
|
|
|
|
// RX hardware checksum
|
|
if ((ndev->features & NETIF_F_RXCSUM) &&
|
|
(skb->protocol == htons(ETH_P_IP) || skb->protocol == htons(ETH_P_IPV6)) &&
|
|
(skb->len >= 64))
|
|
{
|
|
|
|
skb->csum = be16_to_cpu(cpl->rx_csum);
|
|
skb->ip_summed = CHECKSUM_COMPLETE;
|
|
}
|
|
|
|
// unmap
|
|
dma_unmap_page(priv->dev, dma_unmap_addr(rx_info, dma_addr), dma_unmap_len(rx_info, len), PCI_DMA_FROMDEVICE);
|
|
rx_info->dma_addr = 0;
|
|
|
|
len = min_t(u32, cpl->len, rx_info->len);
|
|
|
|
dma_sync_single_range_for_cpu(priv->dev, rx_info->dma_addr, rx_info->page_offset, rx_info->len, PCI_DMA_FROMDEVICE);
|
|
|
|
__skb_fill_page_desc(skb, 0, page, rx_info->page_offset, len);
|
|
rx_info->page = NULL;
|
|
|
|
skb_shinfo(skb)->nr_frags = 1;
|
|
skb->len = len;
|
|
skb->data_len = len;
|
|
skb->truesize += rx_info->len;
|
|
|
|
// hand off SKB
|
|
napi_gro_frags(&cq_ring->napi);
|
|
|
|
ring->packets++;
|
|
ring->bytes += cpl->len;
|
|
|
|
done++;
|
|
|
|
cq_tail_ptr++;
|
|
cq_index = cq_tail_ptr & cq_ring->size_mask;
|
|
}
|
|
|
|
// update CQ tail
|
|
cq_ring->tail_ptr = cq_tail_ptr;
|
|
mqnic_cq_write_tail_ptr(cq_ring);
|
|
|
|
// process ring
|
|
// read tail pointer from NIC
|
|
mqnic_rx_read_tail_ptr(ring);
|
|
|
|
ring_clean_tail_ptr = READ_ONCE(ring->clean_tail_ptr);
|
|
ring_index = ring_clean_tail_ptr & ring->size_mask;
|
|
|
|
while (ring_clean_tail_ptr != ring->tail_ptr)
|
|
{
|
|
rx_info = &ring->rx_info[ring_index];
|
|
|
|
if (rx_info->page)
|
|
break;
|
|
|
|
ring_clean_tail_ptr++;
|
|
ring_index = ring_clean_tail_ptr & ring->size_mask;
|
|
}
|
|
|
|
// update ring tail
|
|
WRITE_ONCE(ring->clean_tail_ptr, ring_clean_tail_ptr);
|
|
|
|
// replenish buffers
|
|
mqnic_refill_rx_buffers(priv, ring);
|
|
|
|
return done;
|
|
}
|
|
|
|
void mqnic_rx_irq(struct mqnic_cq_ring *cq)
|
|
{
|
|
struct mqnic_priv *priv = netdev_priv(cq->ndev);
|
|
|
|
if (likely(priv->port_up))
|
|
{
|
|
napi_schedule_irqoff(&cq->napi);
|
|
}
|
|
else
|
|
{
|
|
mqnic_arm_cq(cq);
|
|
}
|
|
}
|
|
|
|
int mqnic_poll_rx_cq(struct napi_struct *napi, int budget)
|
|
{
|
|
struct mqnic_cq_ring *cq_ring = container_of(napi, struct mqnic_cq_ring, napi);
|
|
struct net_device *ndev = cq_ring->ndev;
|
|
int done;
|
|
|
|
done = mqnic_process_rx_cq(ndev, cq_ring, budget);
|
|
|
|
if (done == budget)
|
|
{
|
|
return done;
|
|
}
|
|
|
|
napi_complete(napi);
|
|
|
|
mqnic_arm_cq(cq_ring);
|
|
|
|
return done;
|
|
}
|
|
|