| // SPDX-License-Identifier: GPL-2.0-only |
| /* Copyright (C) 2023 Intel Corporation */ |
| |
| #include "idpf.h" |
| #include "idpf_virtchnl.h" |
| |
| /** |
| * idpf_buf_lifo_push - push a buffer pointer onto stack |
| * @stack: pointer to stack struct |
| * @buf: pointer to buf to push |
| * |
| * Returns 0 on success, negative on failure |
| **/ |
| static int idpf_buf_lifo_push(struct idpf_buf_lifo *stack, |
| struct idpf_tx_stash *buf) |
| { |
| if (unlikely(stack->top == stack->size)) |
| return -ENOSPC; |
| |
| stack->bufs[stack->top++] = buf; |
| |
| return 0; |
| } |
| |
| /** |
| * idpf_buf_lifo_pop - pop a buffer pointer from stack |
| * @stack: pointer to stack struct |
| **/ |
| static struct idpf_tx_stash *idpf_buf_lifo_pop(struct idpf_buf_lifo *stack) |
| { |
| if (unlikely(!stack->top)) |
| return NULL; |
| |
| return stack->bufs[--stack->top]; |
| } |
| |
| /** |
| * idpf_tx_timeout - Respond to a Tx Hang |
| * @netdev: network interface device structure |
| * @txqueue: TX queue |
| */ |
| void idpf_tx_timeout(struct net_device *netdev, unsigned int txqueue) |
| { |
| struct idpf_adapter *adapter = idpf_netdev_to_adapter(netdev); |
| |
| adapter->tx_timeout_count++; |
| |
| netdev_err(netdev, "Detected Tx timeout: Count %d, Queue %d\n", |
| adapter->tx_timeout_count, txqueue); |
| if (!idpf_is_reset_in_prog(adapter)) { |
| set_bit(IDPF_HR_FUNC_RESET, adapter->flags); |
| queue_delayed_work(adapter->vc_event_wq, |
| &adapter->vc_event_task, |
| msecs_to_jiffies(10)); |
| } |
| } |
| |
| /** |
| * idpf_tx_buf_rel - Release a Tx buffer |
| * @tx_q: the queue that owns the buffer |
| * @tx_buf: the buffer to free |
| */ |
| static void idpf_tx_buf_rel(struct idpf_queue *tx_q, struct idpf_tx_buf *tx_buf) |
| { |
| if (tx_buf->skb) { |
| if (dma_unmap_len(tx_buf, len)) |
| dma_unmap_single(tx_q->dev, |
| dma_unmap_addr(tx_buf, dma), |
| dma_unmap_len(tx_buf, len), |
| DMA_TO_DEVICE); |
| dev_kfree_skb_any(tx_buf->skb); |
| } else if (dma_unmap_len(tx_buf, len)) { |
| dma_unmap_page(tx_q->dev, |
| dma_unmap_addr(tx_buf, dma), |
| dma_unmap_len(tx_buf, len), |
| DMA_TO_DEVICE); |
| } |
| |
| tx_buf->next_to_watch = NULL; |
| tx_buf->skb = NULL; |
| tx_buf->compl_tag = IDPF_SPLITQ_TX_INVAL_COMPL_TAG; |
| dma_unmap_len_set(tx_buf, len, 0); |
| } |
| |
| /** |
| * idpf_tx_buf_rel_all - Free any empty Tx buffers |
| * @txq: queue to be cleaned |
| */ |
| static void idpf_tx_buf_rel_all(struct idpf_queue *txq) |
| { |
| u16 i; |
| |
| /* Buffers already cleared, nothing to do */ |
| if (!txq->tx_buf) |
| return; |
| |
| /* Free all the Tx buffer sk_buffs */ |
| for (i = 0; i < txq->desc_count; i++) |
| idpf_tx_buf_rel(txq, &txq->tx_buf[i]); |
| |
| kfree(txq->tx_buf); |
| txq->tx_buf = NULL; |
| |
| if (!txq->buf_stack.bufs) |
| return; |
| |
| for (i = 0; i < txq->buf_stack.size; i++) |
| kfree(txq->buf_stack.bufs[i]); |
| |
| kfree(txq->buf_stack.bufs); |
| txq->buf_stack.bufs = NULL; |
| } |
| |
| /** |
| * idpf_tx_desc_rel - Free Tx resources per queue |
| * @txq: Tx descriptor ring for a specific queue |
| * @bufq: buffer q or completion q |
| * |
| * Free all transmit software resources |
| */ |
| static void idpf_tx_desc_rel(struct idpf_queue *txq, bool bufq) |
| { |
| if (bufq) |
| idpf_tx_buf_rel_all(txq); |
| |
| if (!txq->desc_ring) |
| return; |
| |
| dmam_free_coherent(txq->dev, txq->size, txq->desc_ring, txq->dma); |
| txq->desc_ring = NULL; |
| txq->next_to_alloc = 0; |
| txq->next_to_use = 0; |
| txq->next_to_clean = 0; |
| } |
| |
| /** |
| * idpf_tx_desc_rel_all - Free Tx Resources for All Queues |
| * @vport: virtual port structure |
| * |
| * Free all transmit software resources |
| */ |
| static void idpf_tx_desc_rel_all(struct idpf_vport *vport) |
| { |
| int i, j; |
| |
| if (!vport->txq_grps) |
| return; |
| |
| for (i = 0; i < vport->num_txq_grp; i++) { |
| struct idpf_txq_group *txq_grp = &vport->txq_grps[i]; |
| |
| for (j = 0; j < txq_grp->num_txq; j++) |
| idpf_tx_desc_rel(txq_grp->txqs[j], true); |
| |
| if (idpf_is_queue_model_split(vport->txq_model)) |
| idpf_tx_desc_rel(txq_grp->complq, false); |
| } |
| } |
| |
| /** |
| * idpf_tx_buf_alloc_all - Allocate memory for all buffer resources |
| * @tx_q: queue for which the buffers are allocated |
| * |
| * Returns 0 on success, negative on failure |
| */ |
| static int idpf_tx_buf_alloc_all(struct idpf_queue *tx_q) |
| { |
| int buf_size; |
| int i; |
| |
| /* Allocate book keeping buffers only. Buffers to be supplied to HW |
| * are allocated by kernel network stack and received as part of skb |
| */ |
| buf_size = sizeof(struct idpf_tx_buf) * tx_q->desc_count; |
| tx_q->tx_buf = kzalloc(buf_size, GFP_KERNEL); |
| if (!tx_q->tx_buf) |
| return -ENOMEM; |
| |
| /* Initialize tx_bufs with invalid completion tags */ |
| for (i = 0; i < tx_q->desc_count; i++) |
| tx_q->tx_buf[i].compl_tag = IDPF_SPLITQ_TX_INVAL_COMPL_TAG; |
| |
| /* Initialize tx buf stack for out-of-order completions if |
| * flow scheduling offload is enabled |
| */ |
| tx_q->buf_stack.bufs = |
| kcalloc(tx_q->desc_count, sizeof(struct idpf_tx_stash *), |
| GFP_KERNEL); |
| if (!tx_q->buf_stack.bufs) |
| return -ENOMEM; |
| |
| tx_q->buf_stack.size = tx_q->desc_count; |
| tx_q->buf_stack.top = tx_q->desc_count; |
| |
| for (i = 0; i < tx_q->desc_count; i++) { |
| tx_q->buf_stack.bufs[i] = kzalloc(sizeof(*tx_q->buf_stack.bufs[i]), |
| GFP_KERNEL); |
| if (!tx_q->buf_stack.bufs[i]) |
| return -ENOMEM; |
| } |
| |
| return 0; |
| } |
| |
| /** |
| * idpf_tx_desc_alloc - Allocate the Tx descriptors |
| * @tx_q: the tx ring to set up |
| * @bufq: buffer or completion queue |
| * |
| * Returns 0 on success, negative on failure |
| */ |
| static int idpf_tx_desc_alloc(struct idpf_queue *tx_q, bool bufq) |
| { |
| struct device *dev = tx_q->dev; |
| u32 desc_sz; |
| int err; |
| |
| if (bufq) { |
| err = idpf_tx_buf_alloc_all(tx_q); |
| if (err) |
| goto err_alloc; |
| |
| desc_sz = sizeof(struct idpf_base_tx_desc); |
| } else { |
| desc_sz = sizeof(struct idpf_splitq_tx_compl_desc); |
| } |
| |
| tx_q->size = tx_q->desc_count * desc_sz; |
| |
| /* Allocate descriptors also round up to nearest 4K */ |
| tx_q->size = ALIGN(tx_q->size, 4096); |
| tx_q->desc_ring = dmam_alloc_coherent(dev, tx_q->size, &tx_q->dma, |
| GFP_KERNEL); |
| if (!tx_q->desc_ring) { |
| dev_err(dev, "Unable to allocate memory for the Tx descriptor ring, size=%d\n", |
| tx_q->size); |
| err = -ENOMEM; |
| goto err_alloc; |
| } |
| |
| tx_q->next_to_alloc = 0; |
| tx_q->next_to_use = 0; |
| tx_q->next_to_clean = 0; |
| set_bit(__IDPF_Q_GEN_CHK, tx_q->flags); |
| |
| return 0; |
| |
| err_alloc: |
| idpf_tx_desc_rel(tx_q, bufq); |
| |
| return err; |
| } |
| |
| /** |
| * idpf_tx_desc_alloc_all - allocate all queues Tx resources |
| * @vport: virtual port private structure |
| * |
| * Returns 0 on success, negative on failure |
| */ |
| static int idpf_tx_desc_alloc_all(struct idpf_vport *vport) |
| { |
| struct device *dev = &vport->adapter->pdev->dev; |
| int err = 0; |
| int i, j; |
| |
| /* Setup buffer queues. In single queue model buffer queues and |
| * completion queues will be same |
| */ |
| for (i = 0; i < vport->num_txq_grp; i++) { |
| for (j = 0; j < vport->txq_grps[i].num_txq; j++) { |
| struct idpf_queue *txq = vport->txq_grps[i].txqs[j]; |
| u8 gen_bits = 0; |
| u16 bufidx_mask; |
| |
| err = idpf_tx_desc_alloc(txq, true); |
| if (err) { |
| dev_err(dev, "Allocation for Tx Queue %u failed\n", |
| i); |
| goto err_out; |
| } |
| |
| if (!idpf_is_queue_model_split(vport->txq_model)) |
| continue; |
| |
| txq->compl_tag_cur_gen = 0; |
| |
| /* Determine the number of bits in the bufid |
| * mask and add one to get the start of the |
| * generation bits |
| */ |
| bufidx_mask = txq->desc_count - 1; |
| while (bufidx_mask >> 1) { |
| txq->compl_tag_gen_s++; |
| bufidx_mask = bufidx_mask >> 1; |
| } |
| txq->compl_tag_gen_s++; |
| |
| gen_bits = IDPF_TX_SPLITQ_COMPL_TAG_WIDTH - |
| txq->compl_tag_gen_s; |
| txq->compl_tag_gen_max = GETMAXVAL(gen_bits); |
| |
| /* Set bufid mask based on location of first |
| * gen bit; it cannot simply be the descriptor |
| * ring size-1 since we can have size values |
| * where not all of those bits are set. |
| */ |
| txq->compl_tag_bufid_m = |
| GETMAXVAL(txq->compl_tag_gen_s); |
| } |
| |
| if (!idpf_is_queue_model_split(vport->txq_model)) |
| continue; |
| |
| /* Setup completion queues */ |
| err = idpf_tx_desc_alloc(vport->txq_grps[i].complq, false); |
| if (err) { |
| dev_err(dev, "Allocation for Tx Completion Queue %u failed\n", |
| i); |
| goto err_out; |
| } |
| } |
| |
| err_out: |
| if (err) |
| idpf_tx_desc_rel_all(vport); |
| |
| return err; |
| } |
| |
| /** |
| * idpf_rx_page_rel - Release an rx buffer page |
| * @rxq: the queue that owns the buffer |
| * @rx_buf: the buffer to free |
| */ |
| static void idpf_rx_page_rel(struct idpf_queue *rxq, struct idpf_rx_buf *rx_buf) |
| { |
| if (unlikely(!rx_buf->page)) |
| return; |
| |
| page_pool_put_full_page(rxq->pp, rx_buf->page, false); |
| |
| rx_buf->page = NULL; |
| rx_buf->page_offset = 0; |
| } |
| |
| /** |
| * idpf_rx_hdr_buf_rel_all - Release header buffer memory |
| * @rxq: queue to use |
| */ |
| static void idpf_rx_hdr_buf_rel_all(struct idpf_queue *rxq) |
| { |
| struct idpf_adapter *adapter = rxq->vport->adapter; |
| |
| dma_free_coherent(&adapter->pdev->dev, |
| rxq->desc_count * IDPF_HDR_BUF_SIZE, |
| rxq->rx_buf.hdr_buf_va, |
| rxq->rx_buf.hdr_buf_pa); |
| rxq->rx_buf.hdr_buf_va = NULL; |
| } |
| |
| /** |
| * idpf_rx_buf_rel_all - Free all Rx buffer resources for a queue |
| * @rxq: queue to be cleaned |
| */ |
| static void idpf_rx_buf_rel_all(struct idpf_queue *rxq) |
| { |
| u16 i; |
| |
| /* queue already cleared, nothing to do */ |
| if (!rxq->rx_buf.buf) |
| return; |
| |
| /* Free all the bufs allocated and given to hw on Rx queue */ |
| for (i = 0; i < rxq->desc_count; i++) |
| idpf_rx_page_rel(rxq, &rxq->rx_buf.buf[i]); |
| |
| if (rxq->rx_hsplit_en) |
| idpf_rx_hdr_buf_rel_all(rxq); |
| |
| page_pool_destroy(rxq->pp); |
| rxq->pp = NULL; |
| |
| kfree(rxq->rx_buf.buf); |
| rxq->rx_buf.buf = NULL; |
| } |
| |
| /** |
| * idpf_rx_desc_rel - Free a specific Rx q resources |
| * @rxq: queue to clean the resources from |
| * @bufq: buffer q or completion q |
| * @q_model: single or split q model |
| * |
| * Free a specific rx queue resources |
| */ |
| static void idpf_rx_desc_rel(struct idpf_queue *rxq, bool bufq, s32 q_model) |
| { |
| if (!rxq) |
| return; |
| |
| if (rxq->skb) { |
| dev_kfree_skb_any(rxq->skb); |
| rxq->skb = NULL; |
| } |
| |
| if (bufq || !idpf_is_queue_model_split(q_model)) |
| idpf_rx_buf_rel_all(rxq); |
| |
| rxq->next_to_alloc = 0; |
| rxq->next_to_clean = 0; |
| rxq->next_to_use = 0; |
| if (!rxq->desc_ring) |
| return; |
| |
| dmam_free_coherent(rxq->dev, rxq->size, rxq->desc_ring, rxq->dma); |
| rxq->desc_ring = NULL; |
| } |
| |
| /** |
| * idpf_rx_desc_rel_all - Free Rx Resources for All Queues |
| * @vport: virtual port structure |
| * |
| * Free all rx queues resources |
| */ |
| static void idpf_rx_desc_rel_all(struct idpf_vport *vport) |
| { |
| struct idpf_rxq_group *rx_qgrp; |
| u16 num_rxq; |
| int i, j; |
| |
| if (!vport->rxq_grps) |
| return; |
| |
| for (i = 0; i < vport->num_rxq_grp; i++) { |
| rx_qgrp = &vport->rxq_grps[i]; |
| |
| if (!idpf_is_queue_model_split(vport->rxq_model)) { |
| for (j = 0; j < rx_qgrp->singleq.num_rxq; j++) |
| idpf_rx_desc_rel(rx_qgrp->singleq.rxqs[j], |
| false, vport->rxq_model); |
| continue; |
| } |
| |
| num_rxq = rx_qgrp->splitq.num_rxq_sets; |
| for (j = 0; j < num_rxq; j++) |
| idpf_rx_desc_rel(&rx_qgrp->splitq.rxq_sets[j]->rxq, |
| false, vport->rxq_model); |
| |
| if (!rx_qgrp->splitq.bufq_sets) |
| continue; |
| |
| for (j = 0; j < vport->num_bufqs_per_qgrp; j++) { |
| struct idpf_bufq_set *bufq_set = |
| &rx_qgrp->splitq.bufq_sets[j]; |
| |
| idpf_rx_desc_rel(&bufq_set->bufq, true, |
| vport->rxq_model); |
| } |
| } |
| } |
| |
| /** |
| * idpf_rx_buf_hw_update - Store the new tail and head values |
| * @rxq: queue to bump |
| * @val: new head index |
| */ |
| void idpf_rx_buf_hw_update(struct idpf_queue *rxq, u32 val) |
| { |
| rxq->next_to_use = val; |
| |
| if (unlikely(!rxq->tail)) |
| return; |
| |
| /* writel has an implicit memory barrier */ |
| writel(val, rxq->tail); |
| } |
| |
| /** |
| * idpf_rx_hdr_buf_alloc_all - Allocate memory for header buffers |
| * @rxq: ring to use |
| * |
| * Returns 0 on success, negative on failure. |
| */ |
| static int idpf_rx_hdr_buf_alloc_all(struct idpf_queue *rxq) |
| { |
| struct idpf_adapter *adapter = rxq->vport->adapter; |
| |
| rxq->rx_buf.hdr_buf_va = |
| dma_alloc_coherent(&adapter->pdev->dev, |
| IDPF_HDR_BUF_SIZE * rxq->desc_count, |
| &rxq->rx_buf.hdr_buf_pa, |
| GFP_KERNEL); |
| if (!rxq->rx_buf.hdr_buf_va) |
| return -ENOMEM; |
| |
| return 0; |
| } |
| |
| /** |
| * idpf_rx_post_buf_refill - Post buffer id to refill queue |
| * @refillq: refill queue to post to |
| * @buf_id: buffer id to post |
| */ |
| static void idpf_rx_post_buf_refill(struct idpf_sw_queue *refillq, u16 buf_id) |
| { |
| u16 nta = refillq->next_to_alloc; |
| |
| /* store the buffer ID and the SW maintained GEN bit to the refillq */ |
| refillq->ring[nta] = |
| FIELD_PREP(IDPF_RX_BI_BUFID_M, buf_id) | |
| FIELD_PREP(IDPF_RX_BI_GEN_M, |
| test_bit(__IDPF_Q_GEN_CHK, refillq->flags)); |
| |
| if (unlikely(++nta == refillq->desc_count)) { |
| nta = 0; |
| change_bit(__IDPF_Q_GEN_CHK, refillq->flags); |
| } |
| refillq->next_to_alloc = nta; |
| } |
| |
| /** |
| * idpf_rx_post_buf_desc - Post buffer to bufq descriptor ring |
| * @bufq: buffer queue to post to |
| * @buf_id: buffer id to post |
| * |
| * Returns false if buffer could not be allocated, true otherwise. |
| */ |
| static bool idpf_rx_post_buf_desc(struct idpf_queue *bufq, u16 buf_id) |
| { |
| struct virtchnl2_splitq_rx_buf_desc *splitq_rx_desc = NULL; |
| u16 nta = bufq->next_to_alloc; |
| struct idpf_rx_buf *buf; |
| dma_addr_t addr; |
| |
| splitq_rx_desc = IDPF_SPLITQ_RX_BUF_DESC(bufq, nta); |
| buf = &bufq->rx_buf.buf[buf_id]; |
| |
| if (bufq->rx_hsplit_en) { |
| splitq_rx_desc->hdr_addr = |
| cpu_to_le64(bufq->rx_buf.hdr_buf_pa + |
| (u32)buf_id * IDPF_HDR_BUF_SIZE); |
| } |
| |
| addr = idpf_alloc_page(bufq->pp, buf, bufq->rx_buf_size); |
| if (unlikely(addr == DMA_MAPPING_ERROR)) |
| return false; |
| |
| splitq_rx_desc->pkt_addr = cpu_to_le64(addr); |
| splitq_rx_desc->qword0.buf_id = cpu_to_le16(buf_id); |
| |
| nta++; |
| if (unlikely(nta == bufq->desc_count)) |
| nta = 0; |
| bufq->next_to_alloc = nta; |
| |
| return true; |
| } |
| |
| /** |
| * idpf_rx_post_init_bufs - Post initial buffers to bufq |
| * @bufq: buffer queue to post working set to |
| * @working_set: number of buffers to put in working set |
| * |
| * Returns true if @working_set bufs were posted successfully, false otherwise. |
| */ |
| static bool idpf_rx_post_init_bufs(struct idpf_queue *bufq, u16 working_set) |
| { |
| int i; |
| |
| for (i = 0; i < working_set; i++) { |
| if (!idpf_rx_post_buf_desc(bufq, i)) |
| return false; |
| } |
| |
| idpf_rx_buf_hw_update(bufq, |
| bufq->next_to_alloc & ~(bufq->rx_buf_stride - 1)); |
| |
| return true; |
| } |
| |
| /** |
| * idpf_rx_create_page_pool - Create a page pool |
| * @rxbufq: RX queue to create page pool for |
| * |
| * Returns &page_pool on success, casted -errno on failure |
| */ |
| static struct page_pool *idpf_rx_create_page_pool(struct idpf_queue *rxbufq) |
| { |
| struct page_pool_params pp = { |
| .flags = PP_FLAG_DMA_MAP | PP_FLAG_DMA_SYNC_DEV, |
| .order = 0, |
| .pool_size = rxbufq->desc_count, |
| .nid = NUMA_NO_NODE, |
| .dev = rxbufq->vport->netdev->dev.parent, |
| .max_len = PAGE_SIZE, |
| .dma_dir = DMA_FROM_DEVICE, |
| .offset = 0, |
| }; |
| |
| return page_pool_create(&pp); |
| } |
| |
| /** |
| * idpf_rx_buf_alloc_all - Allocate memory for all buffer resources |
| * @rxbufq: queue for which the buffers are allocated; equivalent to |
| * rxq when operating in singleq mode |
| * |
| * Returns 0 on success, negative on failure |
| */ |
| static int idpf_rx_buf_alloc_all(struct idpf_queue *rxbufq) |
| { |
| int err = 0; |
| |
| /* Allocate book keeping buffers */ |
| rxbufq->rx_buf.buf = kcalloc(rxbufq->desc_count, |
| sizeof(struct idpf_rx_buf), GFP_KERNEL); |
| if (!rxbufq->rx_buf.buf) { |
| err = -ENOMEM; |
| goto rx_buf_alloc_all_out; |
| } |
| |
| if (rxbufq->rx_hsplit_en) { |
| err = idpf_rx_hdr_buf_alloc_all(rxbufq); |
| if (err) |
| goto rx_buf_alloc_all_out; |
| } |
| |
| /* Allocate buffers to be given to HW. */ |
| if (idpf_is_queue_model_split(rxbufq->vport->rxq_model)) { |
| int working_set = IDPF_RX_BUFQ_WORKING_SET(rxbufq); |
| |
| if (!idpf_rx_post_init_bufs(rxbufq, working_set)) |
| err = -ENOMEM; |
| } else { |
| if (idpf_rx_singleq_buf_hw_alloc_all(rxbufq, |
| rxbufq->desc_count - 1)) |
| err = -ENOMEM; |
| } |
| |
| rx_buf_alloc_all_out: |
| if (err) |
| idpf_rx_buf_rel_all(rxbufq); |
| |
| return err; |
| } |
| |
| /** |
| * idpf_rx_bufs_init - Initialize page pool, allocate rx bufs, and post to HW |
| * @rxbufq: RX queue to create page pool for |
| * |
| * Returns 0 on success, negative on failure |
| */ |
| static int idpf_rx_bufs_init(struct idpf_queue *rxbufq) |
| { |
| struct page_pool *pool; |
| |
| pool = idpf_rx_create_page_pool(rxbufq); |
| if (IS_ERR(pool)) |
| return PTR_ERR(pool); |
| |
| rxbufq->pp = pool; |
| |
| return idpf_rx_buf_alloc_all(rxbufq); |
| } |
| |
| /** |
| * idpf_rx_bufs_init_all - Initialize all RX bufs |
| * @vport: virtual port struct |
| * |
| * Returns 0 on success, negative on failure |
| */ |
| int idpf_rx_bufs_init_all(struct idpf_vport *vport) |
| { |
| struct idpf_rxq_group *rx_qgrp; |
| struct idpf_queue *q; |
| int i, j, err; |
| |
| for (i = 0; i < vport->num_rxq_grp; i++) { |
| rx_qgrp = &vport->rxq_grps[i]; |
| |
| /* Allocate bufs for the rxq itself in singleq */ |
| if (!idpf_is_queue_model_split(vport->rxq_model)) { |
| int num_rxq = rx_qgrp->singleq.num_rxq; |
| |
| for (j = 0; j < num_rxq; j++) { |
| q = rx_qgrp->singleq.rxqs[j]; |
| err = idpf_rx_bufs_init(q); |
| if (err) |
| return err; |
| } |
| |
| continue; |
| } |
| |
| /* Otherwise, allocate bufs for the buffer queues */ |
| for (j = 0; j < vport->num_bufqs_per_qgrp; j++) { |
| q = &rx_qgrp->splitq.bufq_sets[j].bufq; |
| err = idpf_rx_bufs_init(q); |
| if (err) |
| return err; |
| } |
| } |
| |
| return 0; |
| } |
| |
| /** |
| * idpf_rx_desc_alloc - Allocate queue Rx resources |
| * @rxq: Rx queue for which the resources are setup |
| * @bufq: buffer or completion queue |
| * @q_model: single or split queue model |
| * |
| * Returns 0 on success, negative on failure |
| */ |
| static int idpf_rx_desc_alloc(struct idpf_queue *rxq, bool bufq, s32 q_model) |
| { |
| struct device *dev = rxq->dev; |
| |
| if (bufq) |
| rxq->size = rxq->desc_count * |
| sizeof(struct virtchnl2_splitq_rx_buf_desc); |
| else |
| rxq->size = rxq->desc_count * |
| sizeof(union virtchnl2_rx_desc); |
| |
| /* Allocate descriptors and also round up to nearest 4K */ |
| rxq->size = ALIGN(rxq->size, 4096); |
| rxq->desc_ring = dmam_alloc_coherent(dev, rxq->size, |
| &rxq->dma, GFP_KERNEL); |
| if (!rxq->desc_ring) { |
| dev_err(dev, "Unable to allocate memory for the Rx descriptor ring, size=%d\n", |
| rxq->size); |
| return -ENOMEM; |
| } |
| |
| rxq->next_to_alloc = 0; |
| rxq->next_to_clean = 0; |
| rxq->next_to_use = 0; |
| set_bit(__IDPF_Q_GEN_CHK, rxq->flags); |
| |
| return 0; |
| } |
| |
| /** |
| * idpf_rx_desc_alloc_all - allocate all RX queues resources |
| * @vport: virtual port structure |
| * |
| * Returns 0 on success, negative on failure |
| */ |
| static int idpf_rx_desc_alloc_all(struct idpf_vport *vport) |
| { |
| struct device *dev = &vport->adapter->pdev->dev; |
| struct idpf_rxq_group *rx_qgrp; |
| struct idpf_queue *q; |
| int i, j, err; |
| u16 num_rxq; |
| |
| for (i = 0; i < vport->num_rxq_grp; i++) { |
| rx_qgrp = &vport->rxq_grps[i]; |
| if (idpf_is_queue_model_split(vport->rxq_model)) |
| num_rxq = rx_qgrp->splitq.num_rxq_sets; |
| else |
| num_rxq = rx_qgrp->singleq.num_rxq; |
| |
| for (j = 0; j < num_rxq; j++) { |
| if (idpf_is_queue_model_split(vport->rxq_model)) |
| q = &rx_qgrp->splitq.rxq_sets[j]->rxq; |
| else |
| q = rx_qgrp->singleq.rxqs[j]; |
| err = idpf_rx_desc_alloc(q, false, vport->rxq_model); |
| if (err) { |
| dev_err(dev, "Memory allocation for Rx Queue %u failed\n", |
| i); |
| goto err_out; |
| } |
| } |
| |
| if (!idpf_is_queue_model_split(vport->rxq_model)) |
| continue; |
| |
| for (j = 0; j < vport->num_bufqs_per_qgrp; j++) { |
| q = &rx_qgrp->splitq.bufq_sets[j].bufq; |
| err = idpf_rx_desc_alloc(q, true, vport->rxq_model); |
| if (err) { |
| dev_err(dev, "Memory allocation for Rx Buffer Queue %u failed\n", |
| i); |
| goto err_out; |
| } |
| } |
| } |
| |
| return 0; |
| |
| err_out: |
| idpf_rx_desc_rel_all(vport); |
| |
| return err; |
| } |
| |
| /** |
| * idpf_txq_group_rel - Release all resources for txq groups |
| * @vport: vport to release txq groups on |
| */ |
| static void idpf_txq_group_rel(struct idpf_vport *vport) |
| { |
| int i, j; |
| |
| if (!vport->txq_grps) |
| return; |
| |
| for (i = 0; i < vport->num_txq_grp; i++) { |
| struct idpf_txq_group *txq_grp = &vport->txq_grps[i]; |
| |
| for (j = 0; j < txq_grp->num_txq; j++) { |
| kfree(txq_grp->txqs[j]); |
| txq_grp->txqs[j] = NULL; |
| } |
| kfree(txq_grp->complq); |
| txq_grp->complq = NULL; |
| } |
| kfree(vport->txq_grps); |
| vport->txq_grps = NULL; |
| } |
| |
| /** |
| * idpf_rxq_sw_queue_rel - Release software queue resources |
| * @rx_qgrp: rx queue group with software queues |
| */ |
| static void idpf_rxq_sw_queue_rel(struct idpf_rxq_group *rx_qgrp) |
| { |
| int i, j; |
| |
| for (i = 0; i < rx_qgrp->vport->num_bufqs_per_qgrp; i++) { |
| struct idpf_bufq_set *bufq_set = &rx_qgrp->splitq.bufq_sets[i]; |
| |
| for (j = 0; j < bufq_set->num_refillqs; j++) { |
| kfree(bufq_set->refillqs[j].ring); |
| bufq_set->refillqs[j].ring = NULL; |
| } |
| kfree(bufq_set->refillqs); |
| bufq_set->refillqs = NULL; |
| } |
| } |
| |
| /** |
| * idpf_rxq_group_rel - Release all resources for rxq groups |
| * @vport: vport to release rxq groups on |
| */ |
| static void idpf_rxq_group_rel(struct idpf_vport *vport) |
| { |
| int i; |
| |
| if (!vport->rxq_grps) |
| return; |
| |
| for (i = 0; i < vport->num_rxq_grp; i++) { |
| struct idpf_rxq_group *rx_qgrp = &vport->rxq_grps[i]; |
| u16 num_rxq; |
| int j; |
| |
| if (idpf_is_queue_model_split(vport->rxq_model)) { |
| num_rxq = rx_qgrp->splitq.num_rxq_sets; |
| for (j = 0; j < num_rxq; j++) { |
| kfree(rx_qgrp->splitq.rxq_sets[j]); |
| rx_qgrp->splitq.rxq_sets[j] = NULL; |
| } |
| |
| idpf_rxq_sw_queue_rel(rx_qgrp); |
| kfree(rx_qgrp->splitq.bufq_sets); |
| rx_qgrp->splitq.bufq_sets = NULL; |
| } else { |
| num_rxq = rx_qgrp->singleq.num_rxq; |
| for (j = 0; j < num_rxq; j++) { |
| kfree(rx_qgrp->singleq.rxqs[j]); |
| rx_qgrp->singleq.rxqs[j] = NULL; |
| } |
| } |
| } |
| kfree(vport->rxq_grps); |
| vport->rxq_grps = NULL; |
| } |
| |
| /** |
| * idpf_vport_queue_grp_rel_all - Release all queue groups |
| * @vport: vport to release queue groups for |
| */ |
| static void idpf_vport_queue_grp_rel_all(struct idpf_vport *vport) |
| { |
| idpf_txq_group_rel(vport); |
| idpf_rxq_group_rel(vport); |
| } |
| |
| /** |
| * idpf_vport_queues_rel - Free memory for all queues |
| * @vport: virtual port |
| * |
| * Free the memory allocated for queues associated to a vport |
| */ |
| void idpf_vport_queues_rel(struct idpf_vport *vport) |
| { |
| idpf_tx_desc_rel_all(vport); |
| idpf_rx_desc_rel_all(vport); |
| idpf_vport_queue_grp_rel_all(vport); |
| |
| kfree(vport->txqs); |
| vport->txqs = NULL; |
| } |
| |
| /** |
| * idpf_vport_init_fast_path_txqs - Initialize fast path txq array |
| * @vport: vport to init txqs on |
| * |
| * We get a queue index from skb->queue_mapping and we need a fast way to |
| * dereference the queue from queue groups. This allows us to quickly pull a |
| * txq based on a queue index. |
| * |
| * Returns 0 on success, negative on failure |
| */ |
| static int idpf_vport_init_fast_path_txqs(struct idpf_vport *vport) |
| { |
| int i, j, k = 0; |
| |
| vport->txqs = kcalloc(vport->num_txq, sizeof(struct idpf_queue *), |
| GFP_KERNEL); |
| |
| if (!vport->txqs) |
| return -ENOMEM; |
| |
| for (i = 0; i < vport->num_txq_grp; i++) { |
| struct idpf_txq_group *tx_grp = &vport->txq_grps[i]; |
| |
| for (j = 0; j < tx_grp->num_txq; j++, k++) { |
| vport->txqs[k] = tx_grp->txqs[j]; |
| vport->txqs[k]->idx = k; |
| } |
| } |
| |
| return 0; |
| } |
| |
| /** |
| * idpf_vport_init_num_qs - Initialize number of queues |
| * @vport: vport to initialize queues |
| * @vport_msg: data to be filled into vport |
| */ |
| void idpf_vport_init_num_qs(struct idpf_vport *vport, |
| struct virtchnl2_create_vport *vport_msg) |
| { |
| struct idpf_vport_user_config_data *config_data; |
| u16 idx = vport->idx; |
| |
| config_data = &vport->adapter->vport_config[idx]->user_config; |
| vport->num_txq = le16_to_cpu(vport_msg->num_tx_q); |
| vport->num_rxq = le16_to_cpu(vport_msg->num_rx_q); |
| /* number of txqs and rxqs in config data will be zeros only in the |
| * driver load path and we dont update them there after |
| */ |
| if (!config_data->num_req_tx_qs && !config_data->num_req_rx_qs) { |
| config_data->num_req_tx_qs = le16_to_cpu(vport_msg->num_tx_q); |
| config_data->num_req_rx_qs = le16_to_cpu(vport_msg->num_rx_q); |
| } |
| |
| if (idpf_is_queue_model_split(vport->txq_model)) |
| vport->num_complq = le16_to_cpu(vport_msg->num_tx_complq); |
| if (idpf_is_queue_model_split(vport->rxq_model)) |
| vport->num_bufq = le16_to_cpu(vport_msg->num_rx_bufq); |
| |
| /* Adjust number of buffer queues per Rx queue group. */ |
| if (!idpf_is_queue_model_split(vport->rxq_model)) { |
| vport->num_bufqs_per_qgrp = 0; |
| vport->bufq_size[0] = IDPF_RX_BUF_2048; |
| |
| return; |
| } |
| |
| vport->num_bufqs_per_qgrp = IDPF_MAX_BUFQS_PER_RXQ_GRP; |
| /* Bufq[0] default buffer size is 4K |
| * Bufq[1] default buffer size is 2K |
| */ |
| vport->bufq_size[0] = IDPF_RX_BUF_4096; |
| vport->bufq_size[1] = IDPF_RX_BUF_2048; |
| } |
| |
| /** |
| * idpf_vport_calc_num_q_desc - Calculate number of queue groups |
| * @vport: vport to calculate q groups for |
| */ |
| void idpf_vport_calc_num_q_desc(struct idpf_vport *vport) |
| { |
| struct idpf_vport_user_config_data *config_data; |
| int num_bufqs = vport->num_bufqs_per_qgrp; |
| u32 num_req_txq_desc, num_req_rxq_desc; |
| u16 idx = vport->idx; |
| int i; |
| |
| config_data = &vport->adapter->vport_config[idx]->user_config; |
| num_req_txq_desc = config_data->num_req_txq_desc; |
| num_req_rxq_desc = config_data->num_req_rxq_desc; |
| |
| vport->complq_desc_count = 0; |
| if (num_req_txq_desc) { |
| vport->txq_desc_count = num_req_txq_desc; |
| if (idpf_is_queue_model_split(vport->txq_model)) { |
| vport->complq_desc_count = num_req_txq_desc; |
| if (vport->complq_desc_count < IDPF_MIN_TXQ_COMPLQ_DESC) |
| vport->complq_desc_count = |
| IDPF_MIN_TXQ_COMPLQ_DESC; |
| } |
| } else { |
| vport->txq_desc_count = IDPF_DFLT_TX_Q_DESC_COUNT; |
| if (idpf_is_queue_model_split(vport->txq_model)) |
| vport->complq_desc_count = |
| IDPF_DFLT_TX_COMPLQ_DESC_COUNT; |
| } |
| |
| if (num_req_rxq_desc) |
| vport->rxq_desc_count = num_req_rxq_desc; |
| else |
| vport->rxq_desc_count = IDPF_DFLT_RX_Q_DESC_COUNT; |
| |
| for (i = 0; i < num_bufqs; i++) { |
| if (!vport->bufq_desc_count[i]) |
| vport->bufq_desc_count[i] = |
| IDPF_RX_BUFQ_DESC_COUNT(vport->rxq_desc_count, |
| num_bufqs); |
| } |
| } |
| |
| /** |
| * idpf_vport_calc_total_qs - Calculate total number of queues |
| * @adapter: private data struct |
| * @vport_idx: vport idx to retrieve vport pointer |
| * @vport_msg: message to fill with data |
| * @max_q: vport max queue info |
| * |
| * Return 0 on success, error value on failure. |
| */ |
| int idpf_vport_calc_total_qs(struct idpf_adapter *adapter, u16 vport_idx, |
| struct virtchnl2_create_vport *vport_msg, |
| struct idpf_vport_max_q *max_q) |
| { |
| int dflt_splitq_txq_grps = 0, dflt_singleq_txqs = 0; |
| int dflt_splitq_rxq_grps = 0, dflt_singleq_rxqs = 0; |
| u16 num_req_tx_qs = 0, num_req_rx_qs = 0; |
| struct idpf_vport_config *vport_config; |
| u16 num_txq_grps, num_rxq_grps; |
| u32 num_qs; |
| |
| vport_config = adapter->vport_config[vport_idx]; |
| if (vport_config) { |
| num_req_tx_qs = vport_config->user_config.num_req_tx_qs; |
| num_req_rx_qs = vport_config->user_config.num_req_rx_qs; |
| } else { |
| int num_cpus; |
| |
| /* Restrict num of queues to cpus online as a default |
| * configuration to give best performance. User can always |
| * override to a max number of queues via ethtool. |
| */ |
| num_cpus = num_online_cpus(); |
| |
| dflt_splitq_txq_grps = min_t(int, max_q->max_txq, num_cpus); |
| dflt_singleq_txqs = min_t(int, max_q->max_txq, num_cpus); |
| dflt_splitq_rxq_grps = min_t(int, max_q->max_rxq, num_cpus); |
| dflt_singleq_rxqs = min_t(int, max_q->max_rxq, num_cpus); |
| } |
| |
| if (idpf_is_queue_model_split(le16_to_cpu(vport_msg->txq_model))) { |
| num_txq_grps = num_req_tx_qs ? num_req_tx_qs : dflt_splitq_txq_grps; |
| vport_msg->num_tx_complq = cpu_to_le16(num_txq_grps * |
| IDPF_COMPLQ_PER_GROUP); |
| vport_msg->num_tx_q = cpu_to_le16(num_txq_grps * |
| IDPF_DFLT_SPLITQ_TXQ_PER_GROUP); |
| } else { |
| num_txq_grps = IDPF_DFLT_SINGLEQ_TX_Q_GROUPS; |
| num_qs = num_txq_grps * (num_req_tx_qs ? num_req_tx_qs : |
| dflt_singleq_txqs); |
| vport_msg->num_tx_q = cpu_to_le16(num_qs); |
| vport_msg->num_tx_complq = 0; |
| } |
| if (idpf_is_queue_model_split(le16_to_cpu(vport_msg->rxq_model))) { |
| num_rxq_grps = num_req_rx_qs ? num_req_rx_qs : dflt_splitq_rxq_grps; |
| vport_msg->num_rx_bufq = cpu_to_le16(num_rxq_grps * |
| IDPF_MAX_BUFQS_PER_RXQ_GRP); |
| vport_msg->num_rx_q = cpu_to_le16(num_rxq_grps * |
| IDPF_DFLT_SPLITQ_RXQ_PER_GROUP); |
| } else { |
| num_rxq_grps = IDPF_DFLT_SINGLEQ_RX_Q_GROUPS; |
| num_qs = num_rxq_grps * (num_req_rx_qs ? num_req_rx_qs : |
| dflt_singleq_rxqs); |
| vport_msg->num_rx_q = cpu_to_le16(num_qs); |
| vport_msg->num_rx_bufq = 0; |
| } |
| |
| return 0; |
| } |
| |
| /** |
| * idpf_vport_calc_num_q_groups - Calculate number of queue groups |
| * @vport: vport to calculate q groups for |
| */ |
| void idpf_vport_calc_num_q_groups(struct idpf_vport *vport) |
| { |
| if (idpf_is_queue_model_split(vport->txq_model)) |
| vport->num_txq_grp = vport->num_txq; |
| else |
| vport->num_txq_grp = IDPF_DFLT_SINGLEQ_TX_Q_GROUPS; |
| |
| if (idpf_is_queue_model_split(vport->rxq_model)) |
| vport->num_rxq_grp = vport->num_rxq; |
| else |
| vport->num_rxq_grp = IDPF_DFLT_SINGLEQ_RX_Q_GROUPS; |
| } |
| |
| /** |
| * idpf_vport_calc_numq_per_grp - Calculate number of queues per group |
| * @vport: vport to calculate queues for |
| * @num_txq: return parameter for number of TX queues |
| * @num_rxq: return parameter for number of RX queues |
| */ |
| static void idpf_vport_calc_numq_per_grp(struct idpf_vport *vport, |
| u16 *num_txq, u16 *num_rxq) |
| { |
| if (idpf_is_queue_model_split(vport->txq_model)) |
| *num_txq = IDPF_DFLT_SPLITQ_TXQ_PER_GROUP; |
| else |
| *num_txq = vport->num_txq; |
| |
| if (idpf_is_queue_model_split(vport->rxq_model)) |
| *num_rxq = IDPF_DFLT_SPLITQ_RXQ_PER_GROUP; |
| else |
| *num_rxq = vport->num_rxq; |
| } |
| |
| /** |
| * idpf_rxq_set_descids - set the descids supported by this queue |
| * @vport: virtual port data structure |
| * @q: rx queue for which descids are set |
| * |
| */ |
| static void idpf_rxq_set_descids(struct idpf_vport *vport, struct idpf_queue *q) |
| { |
| if (vport->rxq_model == VIRTCHNL2_QUEUE_MODEL_SPLIT) { |
| q->rxdids = VIRTCHNL2_RXDID_2_FLEX_SPLITQ_M; |
| } else { |
| if (vport->base_rxd) |
| q->rxdids = VIRTCHNL2_RXDID_1_32B_BASE_M; |
| else |
| q->rxdids = VIRTCHNL2_RXDID_2_FLEX_SQ_NIC_M; |
| } |
| } |
| |
| /** |
| * idpf_txq_group_alloc - Allocate all txq group resources |
| * @vport: vport to allocate txq groups for |
| * @num_txq: number of txqs to allocate for each group |
| * |
| * Returns 0 on success, negative on failure |
| */ |
| static int idpf_txq_group_alloc(struct idpf_vport *vport, u16 num_txq) |
| { |
| bool flow_sch_en; |
| int err, i; |
| |
| vport->txq_grps = kcalloc(vport->num_txq_grp, |
| sizeof(*vport->txq_grps), GFP_KERNEL); |
| if (!vport->txq_grps) |
| return -ENOMEM; |
| |
| flow_sch_en = !idpf_is_cap_ena(vport->adapter, IDPF_OTHER_CAPS, |
| VIRTCHNL2_CAP_SPLITQ_QSCHED); |
| |
| for (i = 0; i < vport->num_txq_grp; i++) { |
| struct idpf_txq_group *tx_qgrp = &vport->txq_grps[i]; |
| struct idpf_adapter *adapter = vport->adapter; |
| int j; |
| |
| tx_qgrp->vport = vport; |
| tx_qgrp->num_txq = num_txq; |
| |
| for (j = 0; j < tx_qgrp->num_txq; j++) { |
| tx_qgrp->txqs[j] = kzalloc(sizeof(*tx_qgrp->txqs[j]), |
| GFP_KERNEL); |
| if (!tx_qgrp->txqs[j]) { |
| err = -ENOMEM; |
| goto err_alloc; |
| } |
| } |
| |
| for (j = 0; j < tx_qgrp->num_txq; j++) { |
| struct idpf_queue *q = tx_qgrp->txqs[j]; |
| |
| q->dev = &adapter->pdev->dev; |
| q->desc_count = vport->txq_desc_count; |
| q->tx_max_bufs = idpf_get_max_tx_bufs(adapter); |
| q->tx_min_pkt_len = idpf_get_min_tx_pkt_len(adapter); |
| q->vport = vport; |
| q->txq_grp = tx_qgrp; |
| hash_init(q->sched_buf_hash); |
| |
| if (flow_sch_en) |
| set_bit(__IDPF_Q_FLOW_SCH_EN, q->flags); |
| } |
| |
| if (!idpf_is_queue_model_split(vport->txq_model)) |
| continue; |
| |
| tx_qgrp->complq = kcalloc(IDPF_COMPLQ_PER_GROUP, |
| sizeof(*tx_qgrp->complq), |
| GFP_KERNEL); |
| if (!tx_qgrp->complq) { |
| err = -ENOMEM; |
| goto err_alloc; |
| } |
| |
| tx_qgrp->complq->dev = &adapter->pdev->dev; |
| tx_qgrp->complq->desc_count = vport->complq_desc_count; |
| tx_qgrp->complq->vport = vport; |
| tx_qgrp->complq->txq_grp = tx_qgrp; |
| |
| if (flow_sch_en) |
| __set_bit(__IDPF_Q_FLOW_SCH_EN, tx_qgrp->complq->flags); |
| } |
| |
| return 0; |
| |
| err_alloc: |
| idpf_txq_group_rel(vport); |
| |
| return err; |
| } |
| |
| /** |
| * idpf_rxq_group_alloc - Allocate all rxq group resources |
| * @vport: vport to allocate rxq groups for |
| * @num_rxq: number of rxqs to allocate for each group |
| * |
| * Returns 0 on success, negative on failure |
| */ |
| static int idpf_rxq_group_alloc(struct idpf_vport *vport, u16 num_rxq) |
| { |
| struct idpf_adapter *adapter = vport->adapter; |
| struct idpf_queue *q; |
| int i, k, err = 0; |
| bool hs; |
| |
| vport->rxq_grps = kcalloc(vport->num_rxq_grp, |
| sizeof(struct idpf_rxq_group), GFP_KERNEL); |
| if (!vport->rxq_grps) |
| return -ENOMEM; |
| |
| hs = idpf_vport_get_hsplit(vport) == ETHTOOL_TCP_DATA_SPLIT_ENABLED; |
| |
| for (i = 0; i < vport->num_rxq_grp; i++) { |
| struct idpf_rxq_group *rx_qgrp = &vport->rxq_grps[i]; |
| int j; |
| |
| rx_qgrp->vport = vport; |
| if (!idpf_is_queue_model_split(vport->rxq_model)) { |
| rx_qgrp->singleq.num_rxq = num_rxq; |
| for (j = 0; j < num_rxq; j++) { |
| rx_qgrp->singleq.rxqs[j] = |
| kzalloc(sizeof(*rx_qgrp->singleq.rxqs[j]), |
| GFP_KERNEL); |
| if (!rx_qgrp->singleq.rxqs[j]) { |
| err = -ENOMEM; |
| goto err_alloc; |
| } |
| } |
| goto skip_splitq_rx_init; |
| } |
| rx_qgrp->splitq.num_rxq_sets = num_rxq; |
| |
| for (j = 0; j < num_rxq; j++) { |
| rx_qgrp->splitq.rxq_sets[j] = |
| kzalloc(sizeof(struct idpf_rxq_set), |
| GFP_KERNEL); |
| if (!rx_qgrp->splitq.rxq_sets[j]) { |
| err = -ENOMEM; |
| goto err_alloc; |
| } |
| } |
| |
| rx_qgrp->splitq.bufq_sets = kcalloc(vport->num_bufqs_per_qgrp, |
| sizeof(struct idpf_bufq_set), |
| GFP_KERNEL); |
| if (!rx_qgrp->splitq.bufq_sets) { |
| err = -ENOMEM; |
| goto err_alloc; |
| } |
| |
| for (j = 0; j < vport->num_bufqs_per_qgrp; j++) { |
| struct idpf_bufq_set *bufq_set = |
| &rx_qgrp->splitq.bufq_sets[j]; |
| int swq_size = sizeof(struct idpf_sw_queue); |
| |
| q = &rx_qgrp->splitq.bufq_sets[j].bufq; |
| q->dev = &adapter->pdev->dev; |
| q->desc_count = vport->bufq_desc_count[j]; |
| q->vport = vport; |
| q->rxq_grp = rx_qgrp; |
| q->idx = j; |
| q->rx_buf_size = vport->bufq_size[j]; |
| q->rx_buffer_low_watermark = IDPF_LOW_WATERMARK; |
| q->rx_buf_stride = IDPF_RX_BUF_STRIDE; |
| |
| if (hs) { |
| q->rx_hsplit_en = true; |
| q->rx_hbuf_size = IDPF_HDR_BUF_SIZE; |
| } |
| |
| bufq_set->num_refillqs = num_rxq; |
| bufq_set->refillqs = kcalloc(num_rxq, swq_size, |
| GFP_KERNEL); |
| if (!bufq_set->refillqs) { |
| err = -ENOMEM; |
| goto err_alloc; |
| } |
| for (k = 0; k < bufq_set->num_refillqs; k++) { |
| struct idpf_sw_queue *refillq = |
| &bufq_set->refillqs[k]; |
| |
| refillq->dev = &vport->adapter->pdev->dev; |
| refillq->desc_count = |
| vport->bufq_desc_count[j]; |
| set_bit(__IDPF_Q_GEN_CHK, refillq->flags); |
| set_bit(__IDPF_RFLQ_GEN_CHK, refillq->flags); |
| refillq->ring = kcalloc(refillq->desc_count, |
| sizeof(u16), |
| GFP_KERNEL); |
| if (!refillq->ring) { |
| err = -ENOMEM; |
| goto err_alloc; |
| } |
| } |
| } |
| |
| skip_splitq_rx_init: |
| for (j = 0; j < num_rxq; j++) { |
| if (!idpf_is_queue_model_split(vport->rxq_model)) { |
| q = rx_qgrp->singleq.rxqs[j]; |
| goto setup_rxq; |
| } |
| q = &rx_qgrp->splitq.rxq_sets[j]->rxq; |
| rx_qgrp->splitq.rxq_sets[j]->refillq0 = |
| &rx_qgrp->splitq.bufq_sets[0].refillqs[j]; |
| if (vport->num_bufqs_per_qgrp > IDPF_SINGLE_BUFQ_PER_RXQ_GRP) |
| rx_qgrp->splitq.rxq_sets[j]->refillq1 = |
| &rx_qgrp->splitq.bufq_sets[1].refillqs[j]; |
| |
| if (hs) { |
| q->rx_hsplit_en = true; |
| q->rx_hbuf_size = IDPF_HDR_BUF_SIZE; |
| } |
| |
| setup_rxq: |
| q->dev = &adapter->pdev->dev; |
| q->desc_count = vport->rxq_desc_count; |
| q->vport = vport; |
| q->rxq_grp = rx_qgrp; |
| q->idx = (i * num_rxq) + j; |
| /* In splitq mode, RXQ buffer size should be |
| * set to that of the first buffer queue |
| * associated with this RXQ |
| */ |
| q->rx_buf_size = vport->bufq_size[0]; |
| q->rx_buffer_low_watermark = IDPF_LOW_WATERMARK; |
| q->rx_max_pkt_size = vport->netdev->mtu + |
| IDPF_PACKET_HDR_PAD; |
| idpf_rxq_set_descids(vport, q); |
| } |
| } |
| |
| err_alloc: |
| if (err) |
| idpf_rxq_group_rel(vport); |
| |
| return err; |
| } |
| |
| /** |
| * idpf_vport_queue_grp_alloc_all - Allocate all queue groups/resources |
| * @vport: vport with qgrps to allocate |
| * |
| * Returns 0 on success, negative on failure |
| */ |
| static int idpf_vport_queue_grp_alloc_all(struct idpf_vport *vport) |
| { |
| u16 num_txq, num_rxq; |
| int err; |
| |
| idpf_vport_calc_numq_per_grp(vport, &num_txq, &num_rxq); |
| |
| err = idpf_txq_group_alloc(vport, num_txq); |
| if (err) |
| goto err_out; |
| |
| err = idpf_rxq_group_alloc(vport, num_rxq); |
| if (err) |
| goto err_out; |
| |
| return 0; |
| |
| err_out: |
| idpf_vport_queue_grp_rel_all(vport); |
| |
| return err; |
| } |
| |
| /** |
| * idpf_vport_queues_alloc - Allocate memory for all queues |
| * @vport: virtual port |
| * |
| * Allocate memory for queues associated with a vport. Returns 0 on success, |
| * negative on failure. |
| */ |
| int idpf_vport_queues_alloc(struct idpf_vport *vport) |
| { |
| int err; |
| |
| err = idpf_vport_queue_grp_alloc_all(vport); |
| if (err) |
| goto err_out; |
| |
| err = idpf_tx_desc_alloc_all(vport); |
| if (err) |
| goto err_out; |
| |
| err = idpf_rx_desc_alloc_all(vport); |
| if (err) |
| goto err_out; |
| |
| err = idpf_vport_init_fast_path_txqs(vport); |
| if (err) |
| goto err_out; |
| |
| return 0; |
| |
| err_out: |
| idpf_vport_queues_rel(vport); |
| |
| return err; |
| } |
| |
| /** |
| * idpf_tx_handle_sw_marker - Handle queue marker packet |
| * @tx_q: tx queue to handle software marker |
| */ |
| static void idpf_tx_handle_sw_marker(struct idpf_queue *tx_q) |
| { |
| struct idpf_vport *vport = tx_q->vport; |
| int i; |
| |
| clear_bit(__IDPF_Q_SW_MARKER, tx_q->flags); |
| /* Hardware must write marker packets to all queues associated with |
| * completion queues. So check if all queues received marker packets |
| */ |
| for (i = 0; i < vport->num_txq; i++) |
| /* If we're still waiting on any other TXQ marker completions, |
| * just return now since we cannot wake up the marker_wq yet. |
| */ |
| if (test_bit(__IDPF_Q_SW_MARKER, vport->txqs[i]->flags)) |
| return; |
| |
| /* Drain complete */ |
| set_bit(IDPF_VPORT_SW_MARKER, vport->flags); |
| wake_up(&vport->sw_marker_wq); |
| } |
| |
| /** |
| * idpf_tx_splitq_clean_hdr - Clean TX buffer resources for header portion of |
| * packet |
| * @tx_q: tx queue to clean buffer from |
| * @tx_buf: buffer to be cleaned |
| * @cleaned: pointer to stats struct to track cleaned packets/bytes |
| * @napi_budget: Used to determine if we are in netpoll |
| */ |
| static void idpf_tx_splitq_clean_hdr(struct idpf_queue *tx_q, |
| struct idpf_tx_buf *tx_buf, |
| struct idpf_cleaned_stats *cleaned, |
| int napi_budget) |
| { |
| napi_consume_skb(tx_buf->skb, napi_budget); |
| |
| if (dma_unmap_len(tx_buf, len)) { |
| dma_unmap_single(tx_q->dev, |
| dma_unmap_addr(tx_buf, dma), |
| dma_unmap_len(tx_buf, len), |
| DMA_TO_DEVICE); |
| |
| dma_unmap_len_set(tx_buf, len, 0); |
| } |
| |
| /* clear tx_buf data */ |
| tx_buf->skb = NULL; |
| |
| cleaned->bytes += tx_buf->bytecount; |
| cleaned->packets += tx_buf->gso_segs; |
| } |
| |
| /** |
| * idpf_tx_clean_stashed_bufs - clean bufs that were stored for |
| * out of order completions |
| * @txq: queue to clean |
| * @compl_tag: completion tag of packet to clean (from completion descriptor) |
| * @cleaned: pointer to stats struct to track cleaned packets/bytes |
| * @budget: Used to determine if we are in netpoll |
| */ |
| static void idpf_tx_clean_stashed_bufs(struct idpf_queue *txq, u16 compl_tag, |
| struct idpf_cleaned_stats *cleaned, |
| int budget) |
| { |
| struct idpf_tx_stash *stash; |
| struct hlist_node *tmp_buf; |
| |
| /* Buffer completion */ |
| hash_for_each_possible_safe(txq->sched_buf_hash, stash, tmp_buf, |
| hlist, compl_tag) { |
| if (unlikely(stash->buf.compl_tag != (int)compl_tag)) |
| continue; |
| |
| if (stash->buf.skb) { |
| idpf_tx_splitq_clean_hdr(txq, &stash->buf, cleaned, |
| budget); |
| } else if (dma_unmap_len(&stash->buf, len)) { |
| dma_unmap_page(txq->dev, |
| dma_unmap_addr(&stash->buf, dma), |
| dma_unmap_len(&stash->buf, len), |
| DMA_TO_DEVICE); |
| dma_unmap_len_set(&stash->buf, len, 0); |
| } |
| |
| /* Push shadow buf back onto stack */ |
| idpf_buf_lifo_push(&txq->buf_stack, stash); |
| |
| hash_del(&stash->hlist); |
| } |
| } |
| |
| /** |
| * idpf_stash_flow_sch_buffers - store buffer parameters info to be freed at a |
| * later time (only relevant for flow scheduling mode) |
| * @txq: Tx queue to clean |
| * @tx_buf: buffer to store |
| */ |
| static int idpf_stash_flow_sch_buffers(struct idpf_queue *txq, |
| struct idpf_tx_buf *tx_buf) |
| { |
| struct idpf_tx_stash *stash; |
| |
| if (unlikely(!dma_unmap_addr(tx_buf, dma) && |
| !dma_unmap_len(tx_buf, len))) |
| return 0; |
| |
| stash = idpf_buf_lifo_pop(&txq->buf_stack); |
| if (unlikely(!stash)) { |
| net_err_ratelimited("%s: No out-of-order TX buffers left!\n", |
| txq->vport->netdev->name); |
| |
| return -ENOMEM; |
| } |
| |
| /* Store buffer params in shadow buffer */ |
| stash->buf.skb = tx_buf->skb; |
| stash->buf.bytecount = tx_buf->bytecount; |
| stash->buf.gso_segs = tx_buf->gso_segs; |
| dma_unmap_addr_set(&stash->buf, dma, dma_unmap_addr(tx_buf, dma)); |
| dma_unmap_len_set(&stash->buf, len, dma_unmap_len(tx_buf, len)); |
| stash->buf.compl_tag = tx_buf->compl_tag; |
| |
| /* Add buffer to buf_hash table to be freed later */ |
| hash_add(txq->sched_buf_hash, &stash->hlist, stash->buf.compl_tag); |
| |
| memset(tx_buf, 0, sizeof(struct idpf_tx_buf)); |
| |
| /* Reinitialize buf_id portion of tag */ |
| tx_buf->compl_tag = IDPF_SPLITQ_TX_INVAL_COMPL_TAG; |
| |
| return 0; |
| } |
| |
| #define idpf_tx_splitq_clean_bump_ntc(txq, ntc, desc, buf) \ |
| do { \ |
| (ntc)++; \ |
| if (unlikely(!(ntc))) { \ |
| ntc -= (txq)->desc_count; \ |
| buf = (txq)->tx_buf; \ |
| desc = IDPF_FLEX_TX_DESC(txq, 0); \ |
| } else { \ |
| (buf)++; \ |
| (desc)++; \ |
| } \ |
| } while (0) |
| |
| /** |
| * idpf_tx_splitq_clean - Reclaim resources from buffer queue |
| * @tx_q: Tx queue to clean |
| * @end: queue index until which it should be cleaned |
| * @napi_budget: Used to determine if we are in netpoll |
| * @cleaned: pointer to stats struct to track cleaned packets/bytes |
| * @descs_only: true if queue is using flow-based scheduling and should |
| * not clean buffers at this time |
| * |
| * Cleans the queue descriptor ring. If the queue is using queue-based |
| * scheduling, the buffers will be cleaned as well. If the queue is using |
| * flow-based scheduling, only the descriptors are cleaned at this time. |
| * Separate packet completion events will be reported on the completion queue, |
| * and the buffers will be cleaned separately. The stats are not updated from |
| * this function when using flow-based scheduling. |
| */ |
| static void idpf_tx_splitq_clean(struct idpf_queue *tx_q, u16 end, |
| int napi_budget, |
| struct idpf_cleaned_stats *cleaned, |
| bool descs_only) |
| { |
| union idpf_tx_flex_desc *next_pending_desc = NULL; |
| union idpf_tx_flex_desc *tx_desc; |
| s16 ntc = tx_q->next_to_clean; |
| struct idpf_tx_buf *tx_buf; |
| |
| tx_desc = IDPF_FLEX_TX_DESC(tx_q, ntc); |
| next_pending_desc = IDPF_FLEX_TX_DESC(tx_q, end); |
| tx_buf = &tx_q->tx_buf[ntc]; |
| ntc -= tx_q->desc_count; |
| |
| while (tx_desc != next_pending_desc) { |
| union idpf_tx_flex_desc *eop_desc; |
| |
| /* If this entry in the ring was used as a context descriptor, |
| * it's corresponding entry in the buffer ring will have an |
| * invalid completion tag since no buffer was used. We can |
| * skip this descriptor since there is no buffer to clean. |
| */ |
| if (unlikely(tx_buf->compl_tag == IDPF_SPLITQ_TX_INVAL_COMPL_TAG)) |
| goto fetch_next_txq_desc; |
| |
| eop_desc = (union idpf_tx_flex_desc *)tx_buf->next_to_watch; |
| |
| /* clear next_to_watch to prevent false hangs */ |
| tx_buf->next_to_watch = NULL; |
| |
| if (descs_only) { |
| if (idpf_stash_flow_sch_buffers(tx_q, tx_buf)) |
| goto tx_splitq_clean_out; |
| |
| while (tx_desc != eop_desc) { |
| idpf_tx_splitq_clean_bump_ntc(tx_q, ntc, |
| tx_desc, tx_buf); |
| |
| if (dma_unmap_len(tx_buf, len)) { |
| if (idpf_stash_flow_sch_buffers(tx_q, |
| tx_buf)) |
| goto tx_splitq_clean_out; |
| } |
| } |
| } else { |
| idpf_tx_splitq_clean_hdr(tx_q, tx_buf, cleaned, |
| napi_budget); |
| |
| /* unmap remaining buffers */ |
| while (tx_desc != eop_desc) { |
| idpf_tx_splitq_clean_bump_ntc(tx_q, ntc, |
| tx_desc, tx_buf); |
| |
| /* unmap any remaining paged data */ |
| if (dma_unmap_len(tx_buf, len)) { |
| dma_unmap_page(tx_q->dev, |
| dma_unmap_addr(tx_buf, dma), |
| dma_unmap_len(tx_buf, len), |
| DMA_TO_DEVICE); |
| dma_unmap_len_set(tx_buf, len, 0); |
| } |
| } |
| } |
| |
| fetch_next_txq_desc: |
| idpf_tx_splitq_clean_bump_ntc(tx_q, ntc, tx_desc, tx_buf); |
| } |
| |
| tx_splitq_clean_out: |
| ntc += tx_q->desc_count; |
| tx_q->next_to_clean = ntc; |
| } |
| |
| #define idpf_tx_clean_buf_ring_bump_ntc(txq, ntc, buf) \ |
| do { \ |
| (buf)++; \ |
| (ntc)++; \ |
| if (unlikely((ntc) == (txq)->desc_count)) { \ |
| buf = (txq)->tx_buf; \ |
| ntc = 0; \ |
| } \ |
| } while (0) |
| |
| /** |
| * idpf_tx_clean_buf_ring - clean flow scheduling TX queue buffers |
| * @txq: queue to clean |
| * @compl_tag: completion tag of packet to clean (from completion descriptor) |
| * @cleaned: pointer to stats struct to track cleaned packets/bytes |
| * @budget: Used to determine if we are in netpoll |
| * |
| * Cleans all buffers associated with the input completion tag either from the |
| * TX buffer ring or from the hash table if the buffers were previously |
| * stashed. Returns the byte/segment count for the cleaned packet associated |
| * this completion tag. |
| */ |
| static bool idpf_tx_clean_buf_ring(struct idpf_queue *txq, u16 compl_tag, |
| struct idpf_cleaned_stats *cleaned, |
| int budget) |
| { |
| u16 idx = compl_tag & txq->compl_tag_bufid_m; |
| struct idpf_tx_buf *tx_buf = NULL; |
| u16 ntc = txq->next_to_clean; |
| u16 num_descs_cleaned = 0; |
| u16 orig_idx = idx; |
| |
| tx_buf = &txq->tx_buf[idx]; |
| |
| while (tx_buf->compl_tag == (int)compl_tag) { |
| if (tx_buf->skb) { |
| idpf_tx_splitq_clean_hdr(txq, tx_buf, cleaned, budget); |
| } else if (dma_unmap_len(tx_buf, len)) { |
| dma_unmap_page(txq->dev, |
| dma_unmap_addr(tx_buf, dma), |
| dma_unmap_len(tx_buf, len), |
| DMA_TO_DEVICE); |
| dma_unmap_len_set(tx_buf, len, 0); |
| } |
| |
| memset(tx_buf, 0, sizeof(struct idpf_tx_buf)); |
| tx_buf->compl_tag = IDPF_SPLITQ_TX_INVAL_COMPL_TAG; |
| |
| num_descs_cleaned++; |
| idpf_tx_clean_buf_ring_bump_ntc(txq, idx, tx_buf); |
| } |
| |
| /* If we didn't clean anything on the ring for this completion, there's |
| * nothing more to do. |
| */ |
| if (unlikely(!num_descs_cleaned)) |
| return false; |
| |
| /* Otherwise, if we did clean a packet on the ring directly, it's safe |
| * to assume that the descriptors starting from the original |
| * next_to_clean up until the previously cleaned packet can be reused. |
| * Therefore, we will go back in the ring and stash any buffers still |
| * in the ring into the hash table to be cleaned later. |
| */ |
| tx_buf = &txq->tx_buf[ntc]; |
| while (tx_buf != &txq->tx_buf[orig_idx]) { |
| idpf_stash_flow_sch_buffers(txq, tx_buf); |
| idpf_tx_clean_buf_ring_bump_ntc(txq, ntc, tx_buf); |
| } |
| |
| /* Finally, update next_to_clean to reflect the work that was just done |
| * on the ring, if any. If the packet was only cleaned from the hash |
| * table, the ring will not be impacted, therefore we should not touch |
| * next_to_clean. The updated idx is used here |
| */ |
| txq->next_to_clean = idx; |
| |
| return true; |
| } |
| |
| /** |
| * idpf_tx_handle_rs_completion - clean a single packet and all of its buffers |
| * whether on the buffer ring or in the hash table |
| * @txq: Tx ring to clean |
| * @desc: pointer to completion queue descriptor to extract completion |
| * information from |
| * @cleaned: pointer to stats struct to track cleaned packets/bytes |
| * @budget: Used to determine if we are in netpoll |
| * |
| * Returns bytes/packets cleaned |
| */ |
| static void idpf_tx_handle_rs_completion(struct idpf_queue *txq, |
| struct idpf_splitq_tx_compl_desc *desc, |
| struct idpf_cleaned_stats *cleaned, |
| int budget) |
| { |
| u16 compl_tag; |
| |
| if (!test_bit(__IDPF_Q_FLOW_SCH_EN, txq->flags)) { |
| u16 head = le16_to_cpu(desc->q_head_compl_tag.q_head); |
| |
| return idpf_tx_splitq_clean(txq, head, budget, cleaned, false); |
| } |
| |
| compl_tag = le16_to_cpu(desc->q_head_compl_tag.compl_tag); |
| |
| /* If we didn't clean anything on the ring, this packet must be |
| * in the hash table. Go clean it there. |
| */ |
| if (!idpf_tx_clean_buf_ring(txq, compl_tag, cleaned, budget)) |
| idpf_tx_clean_stashed_bufs(txq, compl_tag, cleaned, budget); |
| } |
| |
| /** |
| * idpf_tx_clean_complq - Reclaim resources on completion queue |
| * @complq: Tx ring to clean |
| * @budget: Used to determine if we are in netpoll |
| * @cleaned: returns number of packets cleaned |
| * |
| * Returns true if there's any budget left (e.g. the clean is finished) |
| */ |
| static bool idpf_tx_clean_complq(struct idpf_queue *complq, int budget, |
| int *cleaned) |
| { |
| struct idpf_splitq_tx_compl_desc *tx_desc; |
| struct idpf_vport *vport = complq->vport; |
| s16 ntc = complq->next_to_clean; |
| struct idpf_netdev_priv *np; |
| unsigned int complq_budget; |
| bool complq_ok = true; |
| int i; |
| |
| complq_budget = vport->compln_clean_budget; |
| tx_desc = IDPF_SPLITQ_TX_COMPLQ_DESC(complq, ntc); |
| ntc -= complq->desc_count; |
| |
| do { |
| struct idpf_cleaned_stats cleaned_stats = { }; |
| struct idpf_queue *tx_q; |
| int rel_tx_qid; |
| u16 hw_head; |
| u8 ctype; /* completion type */ |
| u16 gen; |
| |
| /* if the descriptor isn't done, no work yet to do */ |
| gen = le16_get_bits(tx_desc->qid_comptype_gen, |
| IDPF_TXD_COMPLQ_GEN_M); |
| if (test_bit(__IDPF_Q_GEN_CHK, complq->flags) != gen) |
| break; |
| |
| /* Find necessary info of TX queue to clean buffers */ |
| rel_tx_qid = le16_get_bits(tx_desc->qid_comptype_gen, |
| IDPF_TXD_COMPLQ_QID_M); |
| if (rel_tx_qid >= complq->txq_grp->num_txq || |
| !complq->txq_grp->txqs[rel_tx_qid]) { |
| dev_err(&complq->vport->adapter->pdev->dev, |
| "TxQ not found\n"); |
| goto fetch_next_desc; |
| } |
| tx_q = complq->txq_grp->txqs[rel_tx_qid]; |
| |
| /* Determine completion type */ |
| ctype = le16_get_bits(tx_desc->qid_comptype_gen, |
| IDPF_TXD_COMPLQ_COMPL_TYPE_M); |
| switch (ctype) { |
| case IDPF_TXD_COMPLT_RE: |
| hw_head = le16_to_cpu(tx_desc->q_head_compl_tag.q_head); |
| |
| idpf_tx_splitq_clean(tx_q, hw_head, budget, |
| &cleaned_stats, true); |
| break; |
| case IDPF_TXD_COMPLT_RS: |
| idpf_tx_handle_rs_completion(tx_q, tx_desc, |
| &cleaned_stats, budget); |
| break; |
| case IDPF_TXD_COMPLT_SW_MARKER: |
| idpf_tx_handle_sw_marker(tx_q); |
| break; |
| default: |
| dev_err(&tx_q->vport->adapter->pdev->dev, |
| "Unknown TX completion type: %d\n", |
| ctype); |
| goto fetch_next_desc; |
| } |
| |
| u64_stats_update_begin(&tx_q->stats_sync); |
| u64_stats_add(&tx_q->q_stats.tx.packets, cleaned_stats.packets); |
| u64_stats_add(&tx_q->q_stats.tx.bytes, cleaned_stats.bytes); |
| tx_q->cleaned_pkts += cleaned_stats.packets; |
| tx_q->cleaned_bytes += cleaned_stats.bytes; |
| complq->num_completions++; |
| u64_stats_update_end(&tx_q->stats_sync); |
| |
| fetch_next_desc: |
| tx_desc++; |
| ntc++; |
| if (unlikely(!ntc)) { |
| ntc -= complq->desc_count; |
| tx_desc = IDPF_SPLITQ_TX_COMPLQ_DESC(complq, 0); |
| change_bit(__IDPF_Q_GEN_CHK, complq->flags); |
| } |
| |
| prefetch(tx_desc); |
| |
| /* update budget accounting */ |
| complq_budget--; |
| } while (likely(complq_budget)); |
| |
| /* Store the state of the complq to be used later in deciding if a |
| * TXQ can be started again |
| */ |
| if (unlikely(IDPF_TX_COMPLQ_PENDING(complq->txq_grp) > |
| IDPF_TX_COMPLQ_OVERFLOW_THRESH(complq))) |
| complq_ok = false; |
| |
| np = netdev_priv(complq->vport->netdev); |
| for (i = 0; i < complq->txq_grp->num_txq; ++i) { |
| struct idpf_queue *tx_q = complq->txq_grp->txqs[i]; |
| struct netdev_queue *nq; |
| bool dont_wake; |
| |
| /* We didn't clean anything on this queue, move along */ |
| if (!tx_q->cleaned_bytes) |
| continue; |
| |
| *cleaned += tx_q->cleaned_pkts; |
| |
| /* Update BQL */ |
| nq = netdev_get_tx_queue(tx_q->vport->netdev, tx_q->idx); |
| |
| dont_wake = !complq_ok || IDPF_TX_BUF_RSV_LOW(tx_q) || |
| np->state != __IDPF_VPORT_UP || |
| !netif_carrier_ok(tx_q->vport->netdev); |
| /* Check if the TXQ needs to and can be restarted */ |
| __netif_txq_completed_wake(nq, tx_q->cleaned_pkts, tx_q->cleaned_bytes, |
| IDPF_DESC_UNUSED(tx_q), IDPF_TX_WAKE_THRESH, |
| dont_wake); |
| |
| /* Reset cleaned stats for the next time this queue is |
| * cleaned |
| */ |
| tx_q->cleaned_bytes = 0; |
| tx_q->cleaned_pkts = 0; |
| } |
| |
| ntc += complq->desc_count; |
| complq->next_to_clean = ntc; |
| |
| return !!complq_budget; |
| } |
| |
| /** |
| * idpf_tx_splitq_build_ctb - populate command tag and size for queue |
| * based scheduling descriptors |
| * @desc: descriptor to populate |
| * @params: pointer to tx params struct |
| * @td_cmd: command to be filled in desc |
| * @size: size of buffer |
| */ |
| void idpf_tx_splitq_build_ctb(union idpf_tx_flex_desc *desc, |
| struct idpf_tx_splitq_params *params, |
| u16 td_cmd, u16 size) |
| { |
| desc->q.qw1.cmd_dtype = |
| le16_encode_bits(params->dtype, IDPF_FLEX_TXD_QW1_DTYPE_M); |
| desc->q.qw1.cmd_dtype |= |
| le16_encode_bits(td_cmd, IDPF_FLEX_TXD_QW1_CMD_M); |
| desc->q.qw1.buf_size = cpu_to_le16(size); |
| desc->q.qw1.l2tags.l2tag1 = cpu_to_le16(params->td_tag); |
| } |
| |
| /** |
| * idpf_tx_splitq_build_flow_desc - populate command tag and size for flow |
| * scheduling descriptors |
| * @desc: descriptor to populate |
| * @params: pointer to tx params struct |
| * @td_cmd: command to be filled in desc |
| * @size: size of buffer |
| */ |
| void idpf_tx_splitq_build_flow_desc(union idpf_tx_flex_desc *desc, |
| struct idpf_tx_splitq_params *params, |
| u16 td_cmd, u16 size) |
| { |
| desc->flow.qw1.cmd_dtype = (u16)params->dtype | td_cmd; |
| desc->flow.qw1.rxr_bufsize = cpu_to_le16((u16)size); |
| desc->flow.qw1.compl_tag = cpu_to_le16(params->compl_tag); |
| } |
| |
| /** |
| * idpf_tx_maybe_stop_common - 1st level check for common Tx stop conditions |
| * @tx_q: the queue to be checked |
| * @size: number of descriptors we want to assure is available |
| * |
| * Returns 0 if stop is not needed |
| */ |
| int idpf_tx_maybe_stop_common(struct idpf_queue *tx_q, unsigned int size) |
| { |
| struct netdev_queue *nq; |
| |
| if (likely(IDPF_DESC_UNUSED(tx_q) >= size)) |
| return 0; |
| |
| u64_stats_update_begin(&tx_q->stats_sync); |
| u64_stats_inc(&tx_q->q_stats.tx.q_busy); |
| u64_stats_update_end(&tx_q->stats_sync); |
| |
| nq = netdev_get_tx_queue(tx_q->vport->netdev, tx_q->idx); |
| |
| return netif_txq_maybe_stop(nq, IDPF_DESC_UNUSED(tx_q), size, size); |
| } |
| |
| /** |
| * idpf_tx_maybe_stop_splitq - 1st level check for Tx splitq stop conditions |
| * @tx_q: the queue to be checked |
| * @descs_needed: number of descriptors required for this packet |
| * |
| * Returns 0 if stop is not needed |
| */ |
| static int idpf_tx_maybe_stop_splitq(struct idpf_queue *tx_q, |
| unsigned int descs_needed) |
| { |
| if (idpf_tx_maybe_stop_common(tx_q, descs_needed)) |
| goto splitq_stop; |
| |
| /* If there are too many outstanding completions expected on the |
| * completion queue, stop the TX queue to give the device some time to |
| * catch up |
| */ |
| if (unlikely(IDPF_TX_COMPLQ_PENDING(tx_q->txq_grp) > |
| IDPF_TX_COMPLQ_OVERFLOW_THRESH(tx_q->txq_grp->complq))) |
| goto splitq_stop; |
| |
| /* Also check for available book keeping buffers; if we are low, stop |
| * the queue to wait for more completions |
| */ |
| if (unlikely(IDPF_TX_BUF_RSV_LOW(tx_q))) |
| goto splitq_stop; |
| |
| return 0; |
| |
| splitq_stop: |
| u64_stats_update_begin(&tx_q->stats_sync); |
| u64_stats_inc(&tx_q->q_stats.tx.q_busy); |
| u64_stats_update_end(&tx_q->stats_sync); |
| netif_stop_subqueue(tx_q->vport->netdev, tx_q->idx); |
| |
| return -EBUSY; |
| } |
| |
| /** |
| * idpf_tx_buf_hw_update - Store the new tail value |
| * @tx_q: queue to bump |
| * @val: new tail index |
| * @xmit_more: more skb's pending |
| * |
| * The naming here is special in that 'hw' signals that this function is about |
| * to do a register write to update our queue status. We know this can only |
| * mean tail here as HW should be owning head for TX. |
| */ |
| void idpf_tx_buf_hw_update(struct idpf_queue *tx_q, u32 val, |
| bool xmit_more) |
| { |
| struct netdev_queue *nq; |
| |
| nq = netdev_get_tx_queue(tx_q->vport->netdev, tx_q->idx); |
| tx_q->next_to_use = val; |
| |
| idpf_tx_maybe_stop_common(tx_q, IDPF_TX_DESC_NEEDED); |
| |
| /* Force memory writes to complete before letting h/w |
| * know there are new descriptors to fetch. (Only |
| * applicable for weak-ordered memory model archs, |
| * such as IA-64). |
| */ |
| wmb(); |
| |
| /* notify HW of packet */ |
| if (netif_xmit_stopped(nq) || !xmit_more) |
| writel(val, tx_q->tail); |
| } |
| |
| /** |
| * idpf_tx_desc_count_required - calculate number of Tx descriptors needed |
| * @txq: queue to send buffer on |
| * @skb: send buffer |
| * |
| * Returns number of data descriptors needed for this skb. |
| */ |
| unsigned int idpf_tx_desc_count_required(struct idpf_queue *txq, |
| struct sk_buff *skb) |
| { |
| const struct skb_shared_info *shinfo; |
| unsigned int count = 0, i; |
| |
| count += !!skb_headlen(skb); |
| |
| if (!skb_is_nonlinear(skb)) |
| return count; |
| |
| shinfo = skb_shinfo(skb); |
| for (i = 0; i < shinfo->nr_frags; i++) { |
| unsigned int size; |
| |
| size = skb_frag_size(&shinfo->frags[i]); |
| |
| /* We only need to use the idpf_size_to_txd_count check if the |
| * fragment is going to span multiple descriptors, |
| * i.e. size >= 16K. |
| */ |
| if (size >= SZ_16K) |
| count += idpf_size_to_txd_count(size); |
| else |
| count++; |
| } |
| |
| if (idpf_chk_linearize(skb, txq->tx_max_bufs, count)) { |
| if (__skb_linearize(skb)) |
| return 0; |
| |
| count = idpf_size_to_txd_count(skb->len); |
| u64_stats_update_begin(&txq->stats_sync); |
| u64_stats_inc(&txq->q_stats.tx.linearize); |
| u64_stats_update_end(&txq->stats_sync); |
| } |
| |
| return count; |
| } |
| |
| /** |
| * idpf_tx_dma_map_error - handle TX DMA map errors |
| * @txq: queue to send buffer on |
| * @skb: send buffer |
| * @first: original first buffer info buffer for packet |
| * @idx: starting point on ring to unwind |
| */ |
| void idpf_tx_dma_map_error(struct idpf_queue *txq, struct sk_buff *skb, |
| struct idpf_tx_buf *first, u16 idx) |
| { |
| u64_stats_update_begin(&txq->stats_sync); |
| u64_stats_inc(&txq->q_stats.tx.dma_map_errs); |
| u64_stats_update_end(&txq->stats_sync); |
| |
| /* clear dma mappings for failed tx_buf map */ |
| for (;;) { |
| struct idpf_tx_buf *tx_buf; |
| |
| tx_buf = &txq->tx_buf[idx]; |
| idpf_tx_buf_rel(txq, tx_buf); |
| if (tx_buf == first) |
| break; |
| if (idx == 0) |
| idx = txq->desc_count; |
| idx--; |
| } |
| |
| if (skb_is_gso(skb)) { |
| union idpf_tx_flex_desc *tx_desc; |
| |
| /* If we failed a DMA mapping for a TSO packet, we will have |
| * used one additional descriptor for a context |
| * descriptor. Reset that here. |
| */ |
| tx_desc = IDPF_FLEX_TX_DESC(txq, idx); |
| memset(tx_desc, 0, sizeof(struct idpf_flex_tx_ctx_desc)); |
| if (idx == 0) |
| idx = txq->desc_count; |
| idx--; |
| } |
| |
| /* Update tail in case netdev_xmit_more was previously true */ |
| idpf_tx_buf_hw_update(txq, idx, false); |
| } |
| |
| /** |
| * idpf_tx_splitq_bump_ntu - adjust NTU and generation |
| * @txq: the tx ring to wrap |
| * @ntu: ring index to bump |
| */ |
| static unsigned int idpf_tx_splitq_bump_ntu(struct idpf_queue *txq, u16 ntu) |
| { |
| ntu++; |
| |
| if (ntu == txq->desc_count) { |
| ntu = 0; |
| txq->compl_tag_cur_gen = IDPF_TX_ADJ_COMPL_TAG_GEN(txq); |
| } |
| |
| return ntu; |
| } |
| |
| /** |
| * idpf_tx_splitq_map - Build the Tx flex descriptor |
| * @tx_q: queue to send buffer on |
| * @params: pointer to splitq params struct |
| * @first: first buffer info buffer to use |
| * |
| * This function loops over the skb data pointed to by *first |
| * and gets a physical address for each memory location and programs |
| * it and the length into the transmit flex descriptor. |
| */ |
| static void idpf_tx_splitq_map(struct idpf_queue *tx_q, |
| struct idpf_tx_splitq_params *params, |
| struct idpf_tx_buf *first) |
| { |
| union idpf_tx_flex_desc *tx_desc; |
| unsigned int data_len, size; |
| struct idpf_tx_buf *tx_buf; |
| u16 i = tx_q->next_to_use; |
| struct netdev_queue *nq; |
| struct sk_buff *skb; |
| skb_frag_t *frag; |
| u16 td_cmd = 0; |
| dma_addr_t dma; |
| |
| skb = first->skb; |
| |
| td_cmd = params->offload.td_cmd; |
| |
| data_len = skb->data_len; |
| size = skb_headlen(skb); |
| |
| tx_desc = IDPF_FLEX_TX_DESC(tx_q, i); |
| |
| dma = dma_map_single(tx_q->dev, skb->data, size, DMA_TO_DEVICE); |
| |
| tx_buf = first; |
| |
| params->compl_tag = |
| (tx_q->compl_tag_cur_gen << tx_q->compl_tag_gen_s) | i; |
| |
| for (frag = &skb_shinfo(skb)->frags[0];; frag++) { |
| unsigned int max_data = IDPF_TX_MAX_DESC_DATA_ALIGNED; |
| |
| if (dma_mapping_error(tx_q->dev, dma)) |
| return idpf_tx_dma_map_error(tx_q, skb, first, i); |
| |
| tx_buf->compl_tag = params->compl_tag; |
| |
| /* record length, and DMA address */ |
| dma_unmap_len_set(tx_buf, len, size); |
| dma_unmap_addr_set(tx_buf, dma, dma); |
| |
| /* buf_addr is in same location for both desc types */ |
| tx_desc->q.buf_addr = cpu_to_le64(dma); |
| |
| /* The stack can send us fragments that are too large for a |
| * single descriptor i.e. frag size > 16K-1. We will need to |
| * split the fragment across multiple descriptors in this case. |
| * To adhere to HW alignment restrictions, the fragment needs |
| * to be split such that the first chunk ends on a 4K boundary |
| * and all subsequent chunks start on a 4K boundary. We still |
| * want to send as much data as possible though, so our |
| * intermediate descriptor chunk size will be 12K. |
| * |
| * For example, consider a 32K fragment mapped to DMA addr 2600. |
| * ------------------------------------------------------------ |
| * | frag_size = 32K | |
| * ------------------------------------------------------------ |
| * |2600 |16384 |28672 |
| * |
| * 3 descriptors will be used for this fragment. The HW expects |
| * the descriptors to contain the following: |
| * ------------------------------------------------------------ |
| * | size = 13784 | size = 12K | size = 6696 | |
| * | dma = 2600 | dma = 16384 | dma = 28672 | |
| * ------------------------------------------------------------ |
| * |
| * We need to first adjust the max_data for the first chunk so |
| * that it ends on a 4K boundary. By negating the value of the |
| * DMA address and taking only the low order bits, we're |
| * effectively calculating |
| * 4K - (DMA addr lower order bits) = |
| * bytes to next boundary. |
| * |
| * Add that to our base aligned max_data (12K) and we have |
| * our first chunk size. In the example above, |
| * 13784 = 12K + (4096-2600) |
| * |
| * After guaranteeing the first chunk ends on a 4K boundary, we |
| * will give the intermediate descriptors 12K chunks and |
| * whatever is left to the final descriptor. This ensures that |
| * all descriptors used for the remaining chunks of the |
| * fragment start on a 4K boundary and we use as few |
| * descriptors as possible. |
| */ |
| max_data += -dma & (IDPF_TX_MAX_READ_REQ_SIZE - 1); |
| while (unlikely(size > IDPF_TX_MAX_DESC_DATA)) { |
| idpf_tx_splitq_build_desc(tx_desc, params, td_cmd, |
| max_data); |
| |
| tx_desc++; |
| i++; |
| |
| if (i == tx_q->desc_count) { |
| tx_desc = IDPF_FLEX_TX_DESC(tx_q, 0); |
| i = 0; |
| tx_q->compl_tag_cur_gen = |
| IDPF_TX_ADJ_COMPL_TAG_GEN(tx_q); |
| } |
| |
| /* Since this packet has a buffer that is going to span |
| * multiple descriptors, it's going to leave holes in |
| * to the TX buffer ring. To ensure these holes do not |
| * cause issues in the cleaning routines, we will clear |
| * them of any stale data and assign them the same |
| * completion tag as the current packet. Then when the |
| * packet is being cleaned, the cleaning routines will |
| * simply pass over these holes and finish cleaning the |
| * rest of the packet. |
| */ |
| memset(&tx_q->tx_buf[i], 0, sizeof(struct idpf_tx_buf)); |
| tx_q->tx_buf[i].compl_tag = params->compl_tag; |
| |
| /* Adjust the DMA offset and the remaining size of the |
| * fragment. On the first iteration of this loop, |
| * max_data will be >= 12K and <= 16K-1. On any |
| * subsequent iteration of this loop, max_data will |
| * always be 12K. |
| */ |
| dma += max_data; |
| size -= max_data; |
| |
| /* Reset max_data since remaining chunks will be 12K |
| * at most |
| */ |
| max_data = IDPF_TX_MAX_DESC_DATA_ALIGNED; |
| |
| /* buf_addr is in same location for both desc types */ |
| tx_desc->q.buf_addr = cpu_to_le64(dma); |
| } |
| |
| if (!data_len) |
| break; |
| |
| idpf_tx_splitq_build_desc(tx_desc, params, td_cmd, size); |
| tx_desc++; |
| i++; |
| |
| if (i == tx_q->desc_count) { |
| tx_desc = IDPF_FLEX_TX_DESC(tx_q, 0); |
| i = 0; |
| tx_q->compl_tag_cur_gen = IDPF_TX_ADJ_COMPL_TAG_GEN(tx_q); |
| } |
| |
| size = skb_frag_size(frag); |
| data_len -= size; |
| |
| dma = skb_frag_dma_map(tx_q->dev, frag, 0, size, |
| DMA_TO_DEVICE); |
| |
| tx_buf = &tx_q->tx_buf[i]; |
| } |
| |
| /* record SW timestamp if HW timestamp is not available */ |
| skb_tx_timestamp(skb); |
| |
| /* write last descriptor with RS and EOP bits */ |
| td_cmd |= params->eop_cmd; |
| idpf_tx_splitq_build_desc(tx_desc, params, td_cmd, size); |
| i = idpf_tx_splitq_bump_ntu(tx_q, i); |
| |
| /* set next_to_watch value indicating a packet is present */ |
| first->next_to_watch = tx_desc; |
| |
| tx_q->txq_grp->num_completions_pending++; |
| |
| /* record bytecount for BQL */ |
| nq = netdev_get_tx_queue(tx_q->vport->netdev, tx_q->idx); |
| netdev_tx_sent_queue(nq, first->bytecount); |
| |
| idpf_tx_buf_hw_update(tx_q, i, netdev_xmit_more()); |
| } |
| |
| /** |
| * idpf_tso - computes mss and TSO length to prepare for TSO |
| * @skb: pointer to skb |
| * @off: pointer to struct that holds offload parameters |
| * |
| * Returns error (negative) if TSO was requested but cannot be applied to the |
| * given skb, 0 if TSO does not apply to the given skb, or 1 otherwise. |
| */ |
| int idpf_tso(struct sk_buff *skb, struct idpf_tx_offload_params *off) |
| { |
| const struct skb_shared_info *shinfo; |
| union { |
| struct iphdr *v4; |
| struct ipv6hdr *v6; |
| unsigned char *hdr; |
| } ip; |
| union { |
| struct tcphdr *tcp; |
| struct udphdr *udp; |
| unsigned char *hdr; |
| } l4; |
| u32 paylen, l4_start; |
| int err; |
| |
| if (!skb_is_gso(skb)) |
| return 0; |
| |
| err = skb_cow_head(skb, 0); |
| if (err < 0) |
| return err; |
| |
| shinfo = skb_shinfo(skb); |
| |
| ip.hdr = skb_network_header(skb); |
| l4.hdr = skb_transport_header(skb); |
| |
| /* initialize outer IP header fields */ |
| if (ip.v4->version == 4) { |
| ip.v4->tot_len = 0; |
| ip.v4->check = 0; |
| } else if (ip.v6->version == 6) { |
| ip.v6->payload_len = 0; |
| } |
| |
| l4_start = skb_transport_offset(skb); |
| |
| /* remove payload length from checksum */ |
| paylen = skb->len - l4_start; |
| |
| switch (shinfo->gso_type & ~SKB_GSO_DODGY) { |
| case SKB_GSO_TCPV4: |
| case SKB_GSO_TCPV6: |
| csum_replace_by_diff(&l4.tcp->check, |
| (__force __wsum)htonl(paylen)); |
| off->tso_hdr_len = __tcp_hdrlen(l4.tcp) + l4_start; |
| break; |
| case SKB_GSO_UDP_L4: |
| csum_replace_by_diff(&l4.udp->check, |
| (__force __wsum)htonl(paylen)); |
| /* compute length of segmentation header */ |
| off->tso_hdr_len = sizeof(struct udphdr) + l4_start; |
| l4.udp->len = htons(shinfo->gso_size + sizeof(struct udphdr)); |
| break; |
| default: |
| return -EINVAL; |
| } |
| |
| off->tso_len = skb->len - off->tso_hdr_len; |
| off->mss = shinfo->gso_size; |
| off->tso_segs = shinfo->gso_segs; |
| |
| off->tx_flags |= IDPF_TX_FLAGS_TSO; |
| |
| return 1; |
| } |
| |
| /** |
| * __idpf_chk_linearize - Check skb is not using too many buffers |
| * @skb: send buffer |
| * @max_bufs: maximum number of buffers |
| * |
| * For TSO we need to count the TSO header and segment payload separately. As |
| * such we need to check cases where we have max_bufs-1 fragments or more as we |
| * can potentially require max_bufs+1 DMA transactions, 1 for the TSO header, 1 |
| * for the segment payload in the first descriptor, and another max_buf-1 for |
| * the fragments. |
| */ |
| static bool __idpf_chk_linearize(struct sk_buff *skb, unsigned int max_bufs) |
| { |
| const struct skb_shared_info *shinfo = skb_shinfo(skb); |
| const skb_frag_t *frag, *stale; |
| int nr_frags, sum; |
| |
| /* no need to check if number of frags is less than max_bufs - 1 */ |
| nr_frags = shinfo->nr_frags; |
| if (nr_frags < (max_bufs - 1)) |
| return false; |
| |
| /* We need to walk through the list and validate that each group |
| * of max_bufs-2 fragments totals at least gso_size. |
| */ |
| nr_frags -= max_bufs - 2; |
| frag = &shinfo->frags[0]; |
| |
| /* Initialize size to the negative value of gso_size minus 1. We use |
| * this as the worst case scenario in which the frag ahead of us only |
| * provides one byte which is why we are limited to max_bufs-2 |
| * descriptors for a single transmit as the header and previous |
| * fragment are already consuming 2 descriptors. |
| */ |
| sum = 1 - shinfo->gso_size; |
| |
| /* Add size of frags 0 through 4 to create our initial sum */ |
| sum += skb_frag_size(frag++); |
| sum += skb_frag_size(frag++); |
| sum += skb_frag_size(frag++); |
| sum += skb_frag_size(frag++); |
| sum += skb_frag_size(frag++); |
| |
| /* Walk through fragments adding latest fragment, testing it, and |
| * then removing stale fragments from the sum. |
| */ |
| for (stale = &shinfo->frags[0];; stale++) { |
| int stale_size = skb_frag_size(stale); |
| |
| sum += skb_frag_size(frag++); |
| |
| /* The stale fragment may present us with a smaller |
| * descriptor than the actual fragment size. To account |
| * for that we need to remove all the data on the front and |
| * figure out what the remainder would be in the last |
| * descriptor associated with the fragment. |
| */ |
| if (stale_size > IDPF_TX_MAX_DESC_DATA) { |
| int align_pad = -(skb_frag_off(stale)) & |
| (IDPF_TX_MAX_READ_REQ_SIZE - 1); |
| |
| sum -= align_pad; |
| stale_size -= align_pad; |
| |
| do { |
| sum -= IDPF_TX_MAX_DESC_DATA_ALIGNED; |
| stale_size -= IDPF_TX_MAX_DESC_DATA_ALIGNED; |
| } while (stale_size > IDPF_TX_MAX_DESC_DATA); |
| } |
| |
| /* if sum is negative we failed to make sufficient progress */ |
| if (sum < 0) |
| return true; |
| |
| if (!nr_frags--) |
| break; |
| |
| sum -= stale_size; |
| } |
| |
| return false; |
| } |
| |
| /** |
| * idpf_chk_linearize - Check if skb exceeds max descriptors per packet |
| * @skb: send buffer |
| * @max_bufs: maximum scatter gather buffers for single packet |
| * @count: number of buffers this packet needs |
| * |
| * Make sure we don't exceed maximum scatter gather buffers for a single |
| * packet. We have to do some special checking around the boundary (max_bufs-1) |
| * if TSO is on since we need count the TSO header and payload separately. |
| * E.g.: a packet with 7 fragments can require 9 DMA transactions; 1 for TSO |
| * header, 1 for segment payload, and then 7 for the fragments. |
| */ |
| bool idpf_chk_linearize(struct sk_buff *skb, unsigned int max_bufs, |
| unsigned int count) |
| { |
| if (likely(count < max_bufs)) |
| return false; |
| if (skb_is_gso(skb)) |
| return __idpf_chk_linearize(skb, max_bufs); |
| |
| return count > max_bufs; |
| } |
| |
| /** |
| * idpf_tx_splitq_get_ctx_desc - grab next desc and update buffer ring |
| * @txq: queue to put context descriptor on |
| * |
| * Since the TX buffer rings mimics the descriptor ring, update the tx buffer |
| * ring entry to reflect that this index is a context descriptor |
| */ |
| static struct idpf_flex_tx_ctx_desc * |
| idpf_tx_splitq_get_ctx_desc(struct idpf_queue *txq) |
| { |
| struct idpf_flex_tx_ctx_desc *desc; |
| int i = txq->next_to_use; |
| |
| memset(&txq->tx_buf[i], 0, sizeof(struct idpf_tx_buf)); |
| txq->tx_buf[i].compl_tag = IDPF_SPLITQ_TX_INVAL_COMPL_TAG; |
| |
| /* grab the next descriptor */ |
| desc = IDPF_FLEX_TX_CTX_DESC(txq, i); |
| txq->next_to_use = idpf_tx_splitq_bump_ntu(txq, i); |
| |
| return desc; |
| } |
| |
| /** |
| * idpf_tx_drop_skb - free the SKB and bump tail if necessary |
| * @tx_q: queue to send buffer on |
| * @skb: pointer to skb |
| */ |
| netdev_tx_t idpf_tx_drop_skb(struct idpf_queue *tx_q, struct sk_buff *skb) |
| { |
| u64_stats_update_begin(&tx_q->stats_sync); |
| u64_stats_inc(&tx_q->q_stats.tx.skb_drops); |
| u64_stats_update_end(&tx_q->stats_sync); |
| |
| idpf_tx_buf_hw_update(tx_q, tx_q->next_to_use, false); |
| |
| dev_kfree_skb(skb); |
| |
| return NETDEV_TX_OK; |
| } |
| |
| /** |
| * idpf_tx_splitq_frame - Sends buffer on Tx ring using flex descriptors |
| * @skb: send buffer |
| * @tx_q: queue to send buffer on |
| * |
| * Returns NETDEV_TX_OK if sent, else an error code |
| */ |
| static netdev_tx_t idpf_tx_splitq_frame(struct sk_buff *skb, |
| struct idpf_queue *tx_q) |
| { |
| struct idpf_tx_splitq_params tx_params = { }; |
| struct idpf_tx_buf *first; |
| unsigned int count; |
| int tso; |
| |
| count = idpf_tx_desc_count_required(tx_q, skb); |
| if (unlikely(!count)) |
| return idpf_tx_drop_skb(tx_q, skb); |
| |
| tso = idpf_tso(skb, &tx_params.offload); |
| if (unlikely(tso < 0)) |
| return idpf_tx_drop_skb(tx_q, skb); |
| |
| /* Check for splitq specific TX resources */ |
| count += (IDPF_TX_DESCS_PER_CACHE_LINE + tso); |
| if (idpf_tx_maybe_stop_splitq(tx_q, count)) { |
| idpf_tx_buf_hw_update(tx_q, tx_q->next_to_use, false); |
| |
| return NETDEV_TX_BUSY; |
| } |
| |
| if (tso) { |
| /* If tso is needed, set up context desc */ |
| struct idpf_flex_tx_ctx_desc *ctx_desc = |
| idpf_tx_splitq_get_ctx_desc(tx_q); |
| |
| ctx_desc->tso.qw1.cmd_dtype = |
| cpu_to_le16(IDPF_TX_DESC_DTYPE_FLEX_TSO_CTX | |
| IDPF_TX_FLEX_CTX_DESC_CMD_TSO); |
| ctx_desc->tso.qw0.flex_tlen = |
| cpu_to_le32(tx_params.offload.tso_len & |
| IDPF_TXD_FLEX_CTX_TLEN_M); |
| ctx_desc->tso.qw0.mss_rt = |
| cpu_to_le16(tx_params.offload.mss & |
| IDPF_TXD_FLEX_CTX_MSS_RT_M); |
| ctx_desc->tso.qw0.hdr_len = tx_params.offload.tso_hdr_len; |
| |
| u64_stats_update_begin(&tx_q->stats_sync); |
| u64_stats_inc(&tx_q->q_stats.tx.lso_pkts); |
| u64_stats_update_end(&tx_q->stats_sync); |
| } |
| |
| /* record the location of the first descriptor for this packet */ |
| first = &tx_q->tx_buf[tx_q->next_to_use]; |
| first->skb = skb; |
| |
| if (tso) { |
| first->gso_segs = tx_params.offload.tso_segs; |
| first->bytecount = skb->len + |
| ((first->gso_segs - 1) * tx_params.offload.tso_hdr_len); |
| } else { |
| first->gso_segs = 1; |
| first->bytecount = max_t(unsigned int, skb->len, ETH_ZLEN); |
| } |
| |
| if (test_bit(__IDPF_Q_FLOW_SCH_EN, tx_q->flags)) { |
| tx_params.dtype = IDPF_TX_DESC_DTYPE_FLEX_FLOW_SCHE; |
| tx_params.eop_cmd = IDPF_TXD_FLEX_FLOW_CMD_EOP; |
| /* Set the RE bit to catch any packets that may have not been |
| * stashed during RS completion cleaning. MIN_GAP is set to |
| * MIN_RING size to ensure it will be set at least once each |
| * time around the ring. |
| */ |
| if (!(tx_q->next_to_use % IDPF_TX_SPLITQ_RE_MIN_GAP)) { |
| tx_params.eop_cmd |= IDPF_TXD_FLEX_FLOW_CMD_RE; |
| tx_q->txq_grp->num_completions_pending++; |
| } |
| |
| if (skb->ip_summed == CHECKSUM_PARTIAL) |
| tx_params.offload.td_cmd |= IDPF_TXD_FLEX_FLOW_CMD_CS_EN; |
| |
| } else { |
| tx_params.dtype = IDPF_TX_DESC_DTYPE_FLEX_L2TAG1_L2TAG2; |
| tx_params.eop_cmd = IDPF_TXD_LAST_DESC_CMD; |
| |
| if (skb->ip_summed == CHECKSUM_PARTIAL) |
| tx_params.offload.td_cmd |= IDPF_TX_FLEX_DESC_CMD_CS_EN; |
| } |
| |
| idpf_tx_splitq_map(tx_q, &tx_params, first); |
| |
| return NETDEV_TX_OK; |
| } |
| |
| /** |
| * idpf_tx_splitq_start - Selects the right Tx queue to send buffer |
| * @skb: send buffer |
| * @netdev: network interface device structure |
| * |
| * Returns NETDEV_TX_OK if sent, else an error code |
| */ |
| netdev_tx_t idpf_tx_splitq_start(struct sk_buff *skb, |
| struct net_device *netdev) |
| { |
| struct idpf_vport *vport = idpf_netdev_to_vport(netdev); |
| struct idpf_queue *tx_q; |
| |
| if (unlikely(skb_get_queue_mapping(skb) >= vport->num_txq)) { |
| dev_kfree_skb_any(skb); |
| |
| return NETDEV_TX_OK; |
| } |
| |
| tx_q = vport->txqs[skb_get_queue_mapping(skb)]; |
| |
| /* hardware can't handle really short frames, hardware padding works |
| * beyond this point |
| */ |
| if (skb_put_padto(skb, tx_q->tx_min_pkt_len)) { |
| idpf_tx_buf_hw_update(tx_q, tx_q->next_to_use, false); |
| |
| return NETDEV_TX_OK; |
| } |
| |
| return idpf_tx_splitq_frame(skb, tx_q); |
| } |
| |
| /** |
| * idpf_ptype_to_htype - get a hash type |
| * @decoded: Decoded Rx packet type related fields |
| * |
| * Returns appropriate hash type (such as PKT_HASH_TYPE_L2/L3/L4) to be used by |
| * skb_set_hash based on PTYPE as parsed by HW Rx pipeline and is part of |
| * Rx desc. |
| */ |
| enum pkt_hash_types idpf_ptype_to_htype(const struct idpf_rx_ptype_decoded *decoded) |
| { |
| if (!decoded->known) |
| return PKT_HASH_TYPE_NONE; |
| if (decoded->payload_layer == IDPF_RX_PTYPE_PAYLOAD_LAYER_PAY2 && |
| decoded->inner_prot) |
| return PKT_HASH_TYPE_L4; |
| if (decoded->payload_layer == IDPF_RX_PTYPE_PAYLOAD_LAYER_PAY2 && |
| decoded->outer_ip) |
| return PKT_HASH_TYPE_L3; |
| if (decoded->outer_ip == IDPF_RX_PTYPE_OUTER_L2) |
| return PKT_HASH_TYPE_L2; |
| |
| return PKT_HASH_TYPE_NONE; |
| } |
| |
| /** |
| * idpf_rx_hash - set the hash value in the skb |
| * @rxq: Rx descriptor ring packet is being transacted on |
| * @skb: pointer to current skb being populated |
| * @rx_desc: Receive descriptor |
| * @decoded: Decoded Rx packet type related fields |
| */ |
| static void idpf_rx_hash(struct idpf_queue *rxq, struct sk_buff *skb, |
| struct virtchnl2_rx_flex_desc_adv_nic_3 *rx_desc, |
| struct idpf_rx_ptype_decoded *decoded) |
| { |
| u32 hash; |
| |
| if (unlikely(!idpf_is_feature_ena(rxq->vport, NETIF_F_RXHASH))) |
| return; |
| |
| hash = le16_to_cpu(rx_desc->hash1) | |
| (rx_desc->ff2_mirrid_hash2.hash2 << 16) | |
| (rx_desc->hash3 << 24); |
| |
| skb_set_hash(skb, hash, idpf_ptype_to_htype(decoded)); |
| } |
| |
| /** |
| * idpf_rx_csum - Indicate in skb if checksum is good |
| * @rxq: Rx descriptor ring packet is being transacted on |
| * @skb: pointer to current skb being populated |
| * @csum_bits: checksum fields extracted from the descriptor |
| * @decoded: Decoded Rx packet type related fields |
| * |
| * skb->protocol must be set before this function is called |
| */ |
| static void idpf_rx_csum(struct idpf_queue *rxq, struct sk_buff *skb, |
| struct idpf_rx_csum_decoded *csum_bits, |
| struct idpf_rx_ptype_decoded *decoded) |
| { |
| bool ipv4, ipv6; |
| |
| /* check if Rx checksum is enabled */ |
| if (unlikely(!idpf_is_feature_ena(rxq->vport, NETIF_F_RXCSUM))) |
| return; |
| |
| /* check if HW has decoded the packet and checksum */ |
| if (!(csum_bits->l3l4p)) |
| return; |
| |
| ipv4 = IDPF_RX_PTYPE_TO_IPV(decoded, IDPF_RX_PTYPE_OUTER_IPV4); |
| ipv6 = IDPF_RX_PTYPE_TO_IPV(decoded, IDPF_RX_PTYPE_OUTER_IPV6); |
| |
| if (ipv4 && (csum_bits->ipe || csum_bits->eipe)) |
| goto checksum_fail; |
| |
| if (ipv6 && csum_bits->ipv6exadd) |
| return; |
| |
| /* check for L4 errors and handle packets that were not able to be |
| * checksummed |
| */ |
| if (csum_bits->l4e) |
| goto checksum_fail; |
| |
| /* Only report checksum unnecessary for ICMP, TCP, UDP, or SCTP */ |
| switch (decoded->inner_prot) { |
| case IDPF_RX_PTYPE_INNER_PROT_ICMP: |
| case IDPF_RX_PTYPE_INNER_PROT_TCP: |
| case IDPF_RX_PTYPE_INNER_PROT_UDP: |
| if (!csum_bits->raw_csum_inv) { |
| u16 csum = csum_bits->raw_csum; |
| |
| skb->csum = csum_unfold((__force __sum16)~swab16(csum)); |
| skb->ip_summed = CHECKSUM_COMPLETE; |
| } else { |
| skb->ip_summed = CHECKSUM_UNNECESSARY; |
| } |
| break; |
| case IDPF_RX_PTYPE_INNER_PROT_SCTP: |
| skb->ip_summed = CHECKSUM_UNNECESSARY; |
| break; |
| default: |
| break; |
| } |
| |
| return; |
| |
| checksum_fail: |
| u64_stats_update_begin(&rxq->stats_sync); |
| u64_stats_inc(&rxq->q_stats.rx.hw_csum_err); |
| u64_stats_update_end(&rxq->stats_sync); |
| } |
| |
| /** |
| * idpf_rx_splitq_extract_csum_bits - Extract checksum bits from descriptor |
| * @rx_desc: receive descriptor |
| * @csum: structure to extract checksum fields |
| * |
| **/ |
| static void idpf_rx_splitq_extract_csum_bits(struct virtchnl2_rx_flex_desc_adv_nic_3 *rx_desc, |
| struct idpf_rx_csum_decoded *csum) |
| { |
| u8 qword0, qword1; |
| |
| qword0 = rx_desc->status_err0_qw0; |
| qword1 = rx_desc->status_err0_qw1; |
| |
| csum->ipe = FIELD_GET(VIRTCHNL2_RX_FLEX_DESC_ADV_STATUS0_XSUM_IPE_M, |
| qword1); |
| csum->eipe = FIELD_GET(VIRTCHNL2_RX_FLEX_DESC_ADV_STATUS0_XSUM_EIPE_M, |
| qword1); |
| csum->l4e = FIELD_GET(VIRTCHNL2_RX_FLEX_DESC_ADV_STATUS0_XSUM_L4E_M, |
| qword1); |
| csum->l3l4p = FIELD_GET(VIRTCHNL2_RX_FLEX_DESC_ADV_STATUS0_L3L4P_M, |
| qword1); |
| csum->ipv6exadd = FIELD_GET(VIRTCHNL2_RX_FLEX_DESC_ADV_STATUS0_IPV6EXADD_M, |
| qword0); |
| csum->raw_csum_inv = |
| le16_get_bits(rx_desc->ptype_err_fflags0, |
| VIRTCHNL2_RX_FLEX_DESC_ADV_RAW_CSUM_INV_M); |
| csum->raw_csum = le16_to_cpu(rx_desc->misc.raw_cs); |
| } |
| |
| /** |
| * idpf_rx_rsc - Set the RSC fields in the skb |
| * @rxq : Rx descriptor ring packet is being transacted on |
| * @skb : pointer to current skb being populated |
| * @rx_desc: Receive descriptor |
| * @decoded: Decoded Rx packet type related fields |
| * |
| * Return 0 on success and error code on failure |
| * |
| * Populate the skb fields with the total number of RSC segments, RSC payload |
| * length and packet type. |
| */ |
| static int idpf_rx_rsc(struct idpf_queue *rxq, struct sk_buff *skb, |
| struct virtchnl2_rx_flex_desc_adv_nic_3 *rx_desc, |
| struct idpf_rx_ptype_decoded *decoded) |
| { |
| u16 rsc_segments, rsc_seg_len; |
| bool ipv4, ipv6; |
| int len; |
| |
| if (unlikely(!decoded->outer_ip)) |
| return -EINVAL; |
| |
| rsc_seg_len = le16_to_cpu(rx_desc->misc.rscseglen); |
| if (unlikely(!rsc_seg_len)) |
| return -EINVAL; |
| |
| ipv4 = IDPF_RX_PTYPE_TO_IPV(decoded, IDPF_RX_PTYPE_OUTER_IPV4); |
| ipv6 = IDPF_RX_PTYPE_TO_IPV(decoded, IDPF_RX_PTYPE_OUTER_IPV6); |
| |
| if (unlikely(!(ipv4 ^ ipv6))) |
| return -EINVAL; |
| |
| rsc_segments = DIV_ROUND_UP(skb->data_len, rsc_seg_len); |
| if (unlikely(rsc_segments == 1)) |
| return 0; |
| |
| NAPI_GRO_CB(skb)->count = rsc_segments; |
| skb_shinfo(skb)->gso_size = rsc_seg_len; |
| |
| skb_reset_network_header(skb); |
| len = skb->len - skb_transport_offset(skb); |
| |
| if (ipv4) { |
| struct iphdr *ipv4h = ip_hdr(skb); |
| |
| skb_shinfo(skb)->gso_type = SKB_GSO_TCPV4; |
| |
| /* Reset and set transport header offset in skb */ |
| skb_set_transport_header(skb, sizeof(struct iphdr)); |
| |
| /* Compute the TCP pseudo header checksum*/ |
| tcp_hdr(skb)->check = |
| ~tcp_v4_check(len, ipv4h->saddr, ipv4h->daddr, 0); |
| } else { |
| struct ipv6hdr *ipv6h = ipv6_hdr(skb); |
| |
| skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6; |
| skb_set_transport_header(skb, sizeof(struct ipv6hdr)); |
| tcp_hdr(skb)->check = |
| ~tcp_v6_check(len, &ipv6h->saddr, &ipv6h->daddr, 0); |
| } |
| |
| tcp_gro_complete(skb); |
| |
| u64_stats_update_begin(&rxq->stats_sync); |
| u64_stats_inc(&rxq->q_stats.rx.rsc_pkts); |
| u64_stats_update_end(&rxq->stats_sync); |
| |
| return 0; |
| } |
| |
| /** |
| * idpf_rx_process_skb_fields - Populate skb header fields from Rx descriptor |
| * @rxq: Rx descriptor ring packet is being transacted on |
| * @skb: pointer to current skb being populated |
| * @rx_desc: Receive descriptor |
| * |
| * This function checks the ring, descriptor, and packet information in |
| * order to populate the hash, checksum, protocol, and |
| * other fields within the skb. |
| */ |
| static int idpf_rx_process_skb_fields(struct idpf_queue *rxq, |
| struct sk_buff *skb, |
| struct virtchnl2_rx_flex_desc_adv_nic_3 *rx_desc) |
| { |
| struct idpf_rx_csum_decoded csum_bits = { }; |
| struct idpf_rx_ptype_decoded decoded; |
| u16 rx_ptype; |
| |
| rx_ptype = le16_get_bits(rx_desc->ptype_err_fflags0, |
| VIRTCHNL2_RX_FLEX_DESC_ADV_PTYPE_M); |
| |
| decoded = rxq->vport->rx_ptype_lkup[rx_ptype]; |
| /* If we don't know the ptype we can't do anything else with it. Just |
| * pass it up the stack as-is. |
| */ |
| if (!decoded.known) |
| return 0; |
| |
| /* process RSS/hash */ |
| idpf_rx_hash(rxq, skb, rx_desc, &decoded); |
| |
| skb->protocol = eth_type_trans(skb, rxq->vport->netdev); |
| |
| if (le16_get_bits(rx_desc->hdrlen_flags, |
| VIRTCHNL2_RX_FLEX_DESC_ADV_RSC_M)) |
| return idpf_rx_rsc(rxq, skb, rx_desc, &decoded); |
| |
| idpf_rx_splitq_extract_csum_bits(rx_desc, &csum_bits); |
| idpf_rx_csum(rxq, skb, &csum_bits, &decoded); |
| |
| return 0; |
| } |
| |
| /** |
| * idpf_rx_add_frag - Add contents of Rx buffer to sk_buff as a frag |
| * @rx_buf: buffer containing page to add |
| * @skb: sk_buff to place the data into |
| * @size: packet length from rx_desc |
| * |
| * This function will add the data contained in rx_buf->page to the skb. |
| * It will just attach the page as a frag to the skb. |
| * The function will then update the page offset. |
| */ |
| void idpf_rx_add_frag(struct idpf_rx_buf *rx_buf, struct sk_buff *skb, |
| unsigned int size) |
| { |
| skb_add_rx_frag(skb, skb_shinfo(skb)->nr_frags, rx_buf->page, |
| rx_buf->page_offset, size, rx_buf->truesize); |
| |
| rx_buf->page = NULL; |
| } |
| |
| /** |
| * idpf_rx_construct_skb - Allocate skb and populate it |
| * @rxq: Rx descriptor queue |
| * @rx_buf: Rx buffer to pull data from |
| * @size: the length of the packet |
| * |
| * This function allocates an skb. It then populates it with the page |
| * data from the current receive descriptor, taking care to set up the |
| * skb correctly. |
| */ |
| struct sk_buff *idpf_rx_construct_skb(struct idpf_queue *rxq, |
| struct idpf_rx_buf *rx_buf, |
| unsigned int size) |
| { |
| unsigned int headlen; |
| struct sk_buff *skb; |
| void *va; |
| |
| va = page_address(rx_buf->page) + rx_buf->page_offset; |
| |
| /* prefetch first cache line of first page */ |
| net_prefetch(va); |
| /* allocate a skb to store the frags */ |
| skb = __napi_alloc_skb(&rxq->q_vector->napi, IDPF_RX_HDR_SIZE, |
| GFP_ATOMIC); |
| if (unlikely(!skb)) { |
| idpf_rx_put_page(rx_buf); |
| |
| return NULL; |
| } |
| |
| skb_record_rx_queue(skb, rxq->idx); |
| skb_mark_for_recycle(skb); |
| |
| /* Determine available headroom for copy */ |
| headlen = size; |
| if (headlen > IDPF_RX_HDR_SIZE) |
| headlen = eth_get_headlen(skb->dev, va, IDPF_RX_HDR_SIZE); |
| |
| /* align pull length to size of long to optimize memcpy performance */ |
| memcpy(__skb_put(skb, headlen), va, ALIGN(headlen, sizeof(long))); |
| |
| /* if we exhaust the linear part then add what is left as a frag */ |
| size -= headlen; |
| if (!size) { |
| idpf_rx_put_page(rx_buf); |
| |
| return skb; |
| } |
| |
| skb_add_rx_frag(skb, 0, rx_buf->page, rx_buf->page_offset + headlen, |
| size, rx_buf->truesize); |
| |
| /* Since we're giving the page to the stack, clear our reference to it. |
| * We'll get a new one during buffer posting. |
| */ |
| rx_buf->page = NULL; |
| |
| return skb; |
| } |
| |
| /** |
| * idpf_rx_hdr_construct_skb - Allocate skb and populate it from header buffer |
| * @rxq: Rx descriptor queue |
| * @va: Rx buffer to pull data from |
| * @size: the length of the packet |
| * |
| * This function allocates an skb. It then populates it with the page data from |
| * the current receive descriptor, taking care to set up the skb correctly. |
| * This specifically uses a header buffer to start building the skb. |
| */ |
| static struct sk_buff *idpf_rx_hdr_construct_skb(struct idpf_queue *rxq, |
| const void *va, |
| unsigned int size) |
| { |
| struct sk_buff *skb; |
| |
| /* allocate a skb to store the frags */ |
| skb = __napi_alloc_skb(&rxq->q_vector->napi, size, GFP_ATOMIC); |
| if (unlikely(!skb)) |
| return NULL; |
| |
| skb_record_rx_queue(skb, rxq->idx); |
| |
| memcpy(__skb_put(skb, size), va, ALIGN(size, sizeof(long))); |
| |
| /* More than likely, a payload fragment, which will use a page from |
| * page_pool will be added to the SKB so mark it for recycle |
| * preemptively. And if not, it's inconsequential. |
| */ |
| skb_mark_for_recycle(skb); |
| |
| return skb; |
| } |
| |
| /** |
| * idpf_rx_splitq_test_staterr - tests bits in Rx descriptor |
| * status and error fields |
| * @stat_err_field: field from descriptor to test bits in |
| * @stat_err_bits: value to mask |
| * |
| */ |
| static bool idpf_rx_splitq_test_staterr(const u8 stat_err_field, |
| const u8 stat_err_bits) |
| { |
| return !!(stat_err_field & stat_err_bits); |
| } |
| |
| /** |
| * idpf_rx_splitq_is_eop - process handling of EOP buffers |
| * @rx_desc: Rx descriptor for current buffer |
| * |
| * If the buffer is an EOP buffer, this function exits returning true, |
| * otherwise return false indicating that this is in fact a non-EOP buffer. |
| */ |
| static bool idpf_rx_splitq_is_eop(struct virtchnl2_rx_flex_desc_adv_nic_3 *rx_desc) |
| { |
| /* if we are the last buffer then there is nothing else to do */ |
| return likely(idpf_rx_splitq_test_staterr(rx_desc->status_err0_qw1, |
| IDPF_RXD_EOF_SPLITQ)); |
| } |
| |
| /** |
| * idpf_rx_splitq_clean - Clean completed descriptors from Rx queue |
| * @rxq: Rx descriptor queue to retrieve receive buffer queue |
| * @budget: Total limit on number of packets to process |
| * |
| * This function provides a "bounce buffer" approach to Rx interrupt |
| * processing. The advantage to this is that on systems that have |
| * expensive overhead for IOMMU access this provides a means of avoiding |
| * it by maintaining the mapping of the page to the system. |
| * |
| * Returns amount of work completed |
| */ |
| static int idpf_rx_splitq_clean(struct idpf_queue *rxq, int budget) |
| { |
| int total_rx_bytes = 0, total_rx_pkts = 0; |
| struct idpf_queue *rx_bufq = NULL; |
| struct sk_buff *skb = rxq->skb; |
| u16 ntc = rxq->next_to_clean; |
| |
| /* Process Rx packets bounded by budget */ |
| while (likely(total_rx_pkts < budget)) { |
| struct virtchnl2_rx_flex_desc_adv_nic_3 *rx_desc; |
| struct idpf_sw_queue *refillq = NULL; |
| struct idpf_rxq_set *rxq_set = NULL; |
| struct idpf_rx_buf *rx_buf = NULL; |
| union virtchnl2_rx_desc *desc; |
| unsigned int pkt_len = 0; |
| unsigned int hdr_len = 0; |
| u16 gen_id, buf_id = 0; |
| /* Header buffer overflow only valid for header split */ |
| bool hbo = false; |
| int bufq_id; |
| u8 rxdid; |
| |
| /* get the Rx desc from Rx queue based on 'next_to_clean' */ |
| desc = IDPF_RX_DESC(rxq, ntc); |
| rx_desc = (struct virtchnl2_rx_flex_desc_adv_nic_3 *)desc; |
| |
| /* This memory barrier is needed to keep us from reading |
| * any other fields out of the rx_desc |
| */ |
| dma_rmb(); |
| |
| /* if the descriptor isn't done, no work yet to do */ |
| gen_id = le16_get_bits(rx_desc->pktlen_gen_bufq_id, |
| VIRTCHNL2_RX_FLEX_DESC_ADV_GEN_M); |
| |
| if (test_bit(__IDPF_Q_GEN_CHK, rxq->flags) != gen_id) |
| break; |
| |
| rxdid = FIELD_GET(VIRTCHNL2_RX_FLEX_DESC_ADV_RXDID_M, |
| rx_desc->rxdid_ucast); |
| if (rxdid != VIRTCHNL2_RXDID_2_FLEX_SPLITQ) { |
| IDPF_RX_BUMP_NTC(rxq, ntc); |
| u64_stats_update_begin(&rxq->stats_sync); |
| u64_stats_inc(&rxq->q_stats.rx.bad_descs); |
| u64_stats_update_end(&rxq->stats_sync); |
| continue; |
| } |
| |
| pkt_len = le16_get_bits(rx_desc->pktlen_gen_bufq_id, |
| VIRTCHNL2_RX_FLEX_DESC_ADV_LEN_PBUF_M); |
| |
| hbo = FIELD_GET(VIRTCHNL2_RX_FLEX_DESC_ADV_STATUS0_HBO_M, |
| rx_desc->status_err0_qw1); |
| |
| if (unlikely(hbo)) { |
| /* If a header buffer overflow, occurs, i.e. header is |
| * too large to fit in the header split buffer, HW will |
| * put the entire packet, including headers, in the |
| * data/payload buffer. |
| */ |
| u64_stats_update_begin(&rxq->stats_sync); |
| u64_stats_inc(&rxq->q_stats.rx.hsplit_buf_ovf); |
| u64_stats_update_end(&rxq->stats_sync); |
| goto bypass_hsplit; |
| } |
| |
| hdr_len = le16_get_bits(rx_desc->hdrlen_flags, |
| VIRTCHNL2_RX_FLEX_DESC_ADV_LEN_HDR_M); |
| |
| bypass_hsplit: |
| bufq_id = le16_get_bits(rx_desc->pktlen_gen_bufq_id, |
| VIRTCHNL2_RX_FLEX_DESC_ADV_BUFQ_ID_M); |
| |
| rxq_set = container_of(rxq, struct idpf_rxq_set, rxq); |
| if (!bufq_id) |
| refillq = rxq_set->refillq0; |
| else |
| refillq = rxq_set->refillq1; |
| |
| /* retrieve buffer from the rxq */ |
| rx_bufq = &rxq->rxq_grp->splitq.bufq_sets[bufq_id].bufq; |
| |
| buf_id = le16_to_cpu(rx_desc->buf_id); |
| |
| rx_buf = &rx_bufq->rx_buf.buf[buf_id]; |
| |
| if (hdr_len) { |
| const void *va = (u8 *)rx_bufq->rx_buf.hdr_buf_va + |
| (u32)buf_id * IDPF_HDR_BUF_SIZE; |
| |
| skb = idpf_rx_hdr_construct_skb(rxq, va, hdr_len); |
| u64_stats_update_begin(&rxq->stats_sync); |
| u64_stats_inc(&rxq->q_stats.rx.hsplit_pkts); |
| u64_stats_update_end(&rxq->stats_sync); |
| } |
| |
| if (pkt_len) { |
| idpf_rx_sync_for_cpu(rx_buf, pkt_len); |
| if (skb) |
| idpf_rx_add_frag(rx_buf, skb, pkt_len); |
| else |
| skb = idpf_rx_construct_skb(rxq, rx_buf, |
| pkt_len); |
| } else { |
| idpf_rx_put_page(rx_buf); |
| } |
| |
| /* exit if we failed to retrieve a buffer */ |
| if (!skb) |
| break; |
| |
| idpf_rx_post_buf_refill(refillq, buf_id); |
| |
| IDPF_RX_BUMP_NTC(rxq, ntc); |
| /* skip if it is non EOP desc */ |
| if (!idpf_rx_splitq_is_eop(rx_desc)) |
| continue; |
| |
| /* pad skb if needed (to make valid ethernet frame) */ |
| if (eth_skb_pad(skb)) { |
| skb = NULL; |
| continue; |
| } |
| |
| /* probably a little skewed due to removing CRC */ |
| total_rx_bytes += skb->len; |
| |
| /* protocol */ |
| if (unlikely(idpf_rx_process_skb_fields(rxq, skb, rx_desc))) { |
| dev_kfree_skb_any(skb); |
| skb = NULL; |
| continue; |
| } |
| |
| /* send completed skb up the stack */ |
| napi_gro_receive(&rxq->q_vector->napi, skb); |
| skb = NULL; |
| |
| /* update budget accounting */ |
| total_rx_pkts++; |
| } |
| |
| rxq->next_to_clean = ntc; |
| |
| rxq->skb = skb; |
| u64_stats_update_begin(&rxq->stats_sync); |
| u64_stats_add(&rxq->q_stats.rx.packets, total_rx_pkts); |
| u64_stats_add(&rxq->q_stats.rx.bytes, total_rx_bytes); |
| u64_stats_update_end(&rxq->stats_sync); |
| |
| /* guarantee a trip back through this routine if there was a failure */ |
| return total_rx_pkts; |
| } |
| |
| /** |
| * idpf_rx_update_bufq_desc - Update buffer queue descriptor |
| * @bufq: Pointer to the buffer queue |
| * @refill_desc: SW Refill queue descriptor containing buffer ID |
| * @buf_desc: Buffer queue descriptor |
| * |
| * Return 0 on success and negative on failure. |
| */ |
| static int idpf_rx_update_bufq_desc(struct idpf_queue *bufq, u16 refill_desc, |
| struct virtchnl2_splitq_rx_buf_desc *buf_desc) |
| { |
| struct idpf_rx_buf *buf; |
| dma_addr_t addr; |
| u16 buf_id; |
| |
| buf_id = FIELD_GET(IDPF_RX_BI_BUFID_M, refill_desc); |
| |
| buf = &bufq->rx_buf.buf[buf_id]; |
| |
| addr = idpf_alloc_page(bufq->pp, buf, bufq->rx_buf_size); |
| if (unlikely(addr == DMA_MAPPING_ERROR)) |
| return -ENOMEM; |
| |
| buf_desc->pkt_addr = cpu_to_le64(addr); |
| buf_desc->qword0.buf_id = cpu_to_le16(buf_id); |
| |
| if (!bufq->rx_hsplit_en) |
| return 0; |
| |
| buf_desc->hdr_addr = cpu_to_le64(bufq->rx_buf.hdr_buf_pa + |
| (u32)buf_id * IDPF_HDR_BUF_SIZE); |
| |
| return 0; |
| } |
| |
| /** |
| * idpf_rx_clean_refillq - Clean refill queue buffers |
| * @bufq: buffer queue to post buffers back to |
| * @refillq: refill queue to clean |
| * |
| * This function takes care of the buffer refill management |
| */ |
| static void idpf_rx_clean_refillq(struct idpf_queue *bufq, |
| struct idpf_sw_queue *refillq) |
| { |
| struct virtchnl2_splitq_rx_buf_desc *buf_desc; |
| u16 bufq_nta = bufq->next_to_alloc; |
| u16 ntc = refillq->next_to_clean; |
| int cleaned = 0; |
| u16 gen; |
| |
| buf_desc = IDPF_SPLITQ_RX_BUF_DESC(bufq, bufq_nta); |
| |
| /* make sure we stop at ring wrap in the unlikely case ring is full */ |
| while (likely(cleaned < refillq->desc_count)) { |
| u16 refill_desc = IDPF_SPLITQ_RX_BI_DESC(refillq, ntc); |
| bool failure; |
| |
| gen = FIELD_GET(IDPF_RX_BI_GEN_M, refill_desc); |
| if (test_bit(__IDPF_RFLQ_GEN_CHK, refillq->flags) != gen) |
| break; |
| |
| failure = idpf_rx_update_bufq_desc(bufq, refill_desc, |
| buf_desc); |
| if (failure) |
| break; |
| |
| if (unlikely(++ntc == refillq->desc_count)) { |
| change_bit(__IDPF_RFLQ_GEN_CHK, refillq->flags); |
| ntc = 0; |
| } |
| |
| if (unlikely(++bufq_nta == bufq->desc_count)) { |
| buf_desc = IDPF_SPLITQ_RX_BUF_DESC(bufq, 0); |
| bufq_nta = 0; |
| } else { |
| buf_desc++; |
| } |
| |
| cleaned++; |
| } |
| |
| if (!cleaned) |
| return; |
| |
| /* We want to limit how many transactions on the bus we trigger with |
| * tail writes so we only do it in strides. It's also important we |
| * align the write to a multiple of 8 as required by HW. |
| */ |
| if (((bufq->next_to_use <= bufq_nta ? 0 : bufq->desc_count) + |
| bufq_nta - bufq->next_to_use) >= IDPF_RX_BUF_POST_STRIDE) |
| idpf_rx_buf_hw_update(bufq, ALIGN_DOWN(bufq_nta, |
| IDPF_RX_BUF_POST_STRIDE)); |
| |
| /* update next to alloc since we have filled the ring */ |
| refillq->next_to_clean = ntc; |
| bufq->next_to_alloc = bufq_nta; |
| } |
| |
| /** |
| * idpf_rx_clean_refillq_all - Clean all refill queues |
| * @bufq: buffer queue with refill queues |
| * |
| * Iterates through all refill queues assigned to the buffer queue assigned to |
| * this vector. Returns true if clean is complete within budget, false |
| * otherwise. |
| */ |
| static void idpf_rx_clean_refillq_all(struct idpf_queue *bufq) |
| { |
| struct idpf_bufq_set *bufq_set; |
| int i; |
| |
| bufq_set = container_of(bufq, struct idpf_bufq_set, bufq); |
| for (i = 0; i < bufq_set->num_refillqs; i++) |
| idpf_rx_clean_refillq(bufq, &bufq_set->refillqs[i]); |
| } |
| |
| /** |
| * idpf_vport_intr_clean_queues - MSIX mode Interrupt Handler |
| * @irq: interrupt number |
| * @data: pointer to a q_vector |
| * |
| */ |
| static irqreturn_t idpf_vport_intr_clean_queues(int __always_unused irq, |
| void *data) |
| { |
| struct idpf_q_vector *q_vector = (struct idpf_q_vector *)data; |
| |
| q_vector->total_events++; |
| napi_schedule(&q_vector->napi); |
| |
| return IRQ_HANDLED; |
| } |
| |
| /** |
| * idpf_vport_intr_napi_del_all - Unregister napi for all q_vectors in vport |
| * @vport: virtual port structure |
| * |
| */ |
| static void idpf_vport_intr_napi_del_all(struct idpf_vport *vport) |
| { |
| u16 v_idx; |
| |
| for (v_idx = 0; v_idx < vport->num_q_vectors; v_idx++) |
| netif_napi_del(&vport->q_vectors[v_idx].napi); |
| } |
| |
| /** |
| * idpf_vport_intr_napi_dis_all - Disable NAPI for all q_vectors in the vport |
| * @vport: main vport structure |
| */ |
| static void idpf_vport_intr_napi_dis_all(struct idpf_vport *vport) |
| { |
| int v_idx; |
| |
| for (v_idx = 0; v_idx < vport->num_q_vectors; v_idx++) |
| napi_disable(&vport->q_vectors[v_idx].napi); |
| } |
| |
| /** |
| * idpf_vport_intr_rel - Free memory allocated for interrupt vectors |
| * @vport: virtual port |
| * |
| * Free the memory allocated for interrupt vectors associated to a vport |
| */ |
| void idpf_vport_intr_rel(struct idpf_vport *vport) |
| { |
| int i, j, v_idx; |
| |
| for (v_idx = 0; v_idx < vport->num_q_vectors; v_idx++) { |
| struct idpf_q_vector *q_vector = &vport->q_vectors[v_idx]; |
| |
| kfree(q_vector->bufq); |
| q_vector->bufq = NULL; |
| kfree(q_vector->tx); |
| q_vector->tx = NULL; |
| kfree(q_vector->rx); |
| q_vector->rx = NULL; |
| } |
| |
| /* Clean up the mapping of queues to vectors */ |
| for (i = 0; i < vport->num_rxq_grp; i++) { |
| struct idpf_rxq_group *rx_qgrp = &vport->rxq_grps[i]; |
| |
| if (idpf_is_queue_model_split(vport->rxq_model)) |
| for (j = 0; j < rx_qgrp->splitq.num_rxq_sets; j++) |
| rx_qgrp->splitq.rxq_sets[j]->rxq.q_vector = NULL; |
| else |
| for (j = 0; j < rx_qgrp->singleq.num_rxq; j++) |
| rx_qgrp->singleq.rxqs[j]->q_vector = NULL; |
| } |
| |
| if (idpf_is_queue_model_split(vport->txq_model)) |
| for (i = 0; i < vport->num_txq_grp; i++) |
| vport->txq_grps[i].complq->q_vector = NULL; |
| else |
| for (i = 0; i < vport->num_txq_grp; i++) |
| for (j = 0; j < vport->txq_grps[i].num_txq; j++) |
| vport->txq_grps[i].txqs[j]->q_vector = NULL; |
| |
| kfree(vport->q_vectors); |
| vport->q_vectors = NULL; |
| } |
| |
| /** |
| * idpf_vport_intr_rel_irq - Free the IRQ association with the OS |
| * @vport: main vport structure |
| */ |
| static void idpf_vport_intr_rel_irq(struct idpf_vport *vport) |
| { |
| struct idpf_adapter *adapter = vport->adapter; |
| int vector; |
| |
| for (vector = 0; vector < vport->num_q_vectors; vector++) { |
| struct idpf_q_vector *q_vector = &vport->q_vectors[vector]; |
| int irq_num, vidx; |
| |
| /* free only the irqs that were actually requested */ |
| if (!q_vector) |
| continue; |
| |
| vidx = vport->q_vector_idxs[vector]; |
| irq_num = adapter->msix_entries[vidx].vector; |
| |
| /* clear the affinity_mask in the IRQ descriptor */ |
| irq_set_affinity_hint(irq_num, NULL); |
| free_irq(irq_num, q_vector); |
| } |
| } |
| |
| /** |
| * idpf_vport_intr_dis_irq_all - Disable all interrupt |
| * @vport: main vport structure |
| */ |
| static void idpf_vport_intr_dis_irq_all(struct idpf_vport *vport) |
| { |
| struct idpf_q_vector *q_vector = vport->q_vectors; |
| int q_idx; |
| |
| for (q_idx = 0; q_idx < vport->num_q_vectors; q_idx++) |
| writel(0, q_vector[q_idx].intr_reg.dyn_ctl); |
| } |
| |
| /** |
| * idpf_vport_intr_buildreg_itr - Enable default interrupt generation settings |
| * @q_vector: pointer to q_vector |
| * @type: itr index |
| * @itr: itr value |
| */ |
| static u32 idpf_vport_intr_buildreg_itr(struct idpf_q_vector *q_vector, |
| const int type, u16 itr) |
| { |
| u32 itr_val; |
| |
| itr &= IDPF_ITR_MASK; |
| /* Don't clear PBA because that can cause lost interrupts that |
| * came in while we were cleaning/polling |
| */ |
| itr_val = q_vector->intr_reg.dyn_ctl_intena_m | |
| (type << q_vector->intr_reg.dyn_ctl_itridx_s) | |
| (itr << (q_vector->intr_reg.dyn_ctl_intrvl_s - 1)); |
| |
| return itr_val; |
| } |
| |
| /** |
| * idpf_update_dim_sample - Update dim sample with packets and bytes |
| * @q_vector: the vector associated with the interrupt |
| * @dim_sample: dim sample to update |
| * @dim: dim instance structure |
| * @packets: total packets |
| * @bytes: total bytes |
| * |
| * Update the dim sample with the packets and bytes which are passed to this |
| * function. Set the dim state appropriately if the dim settings gets stale. |
| */ |
| static void idpf_update_dim_sample(struct idpf_q_vector *q_vector, |
| struct dim_sample *dim_sample, |
| struct dim *dim, u64 packets, u64 bytes) |
| { |
| dim_update_sample(q_vector->total_events, packets, bytes, dim_sample); |
| dim_sample->comp_ctr = 0; |
| |
| /* if dim settings get stale, like when not updated for 1 second or |
| * longer, force it to start again. This addresses the frequent case |
| * of an idle queue being switched to by the scheduler. |
| */ |
| if (ktime_ms_delta(dim_sample->time, dim->start_sample.time) >= HZ) |
| dim->state = DIM_START_MEASURE; |
| } |
| |
| /** |
| * idpf_net_dim - Update net DIM algorithm |
| * @q_vector: the vector associated with the interrupt |
| * |
| * Create a DIM sample and notify net_dim() so that it can possibly decide |
| * a new ITR value based on incoming packets, bytes, and interrupts. |
| * |
| * This function is a no-op if the queue is not configured to dynamic ITR. |
| */ |
| static void idpf_net_dim(struct idpf_q_vector *q_vector) |
| { |
| struct dim_sample dim_sample = { }; |
| u64 packets, bytes; |
| u32 i; |
| |
| if (!IDPF_ITR_IS_DYNAMIC(q_vector->tx_intr_mode)) |
| goto check_rx_itr; |
| |
| for (i = 0, packets = 0, bytes = 0; i < q_vector->num_txq; i++) { |
| struct idpf_queue *txq = q_vector->tx[i]; |
| unsigned int start; |
| |
| do { |
| start = u64_stats_fetch_begin(&txq->stats_sync); |
| packets += u64_stats_read(&txq->q_stats.tx.packets); |
| bytes += u64_stats_read(&txq->q_stats.tx.bytes); |
| } while (u64_stats_fetch_retry(&txq->stats_sync, start)); |
| } |
| |
| idpf_update_dim_sample(q_vector, &dim_sample, &q_vector->tx_dim, |
| packets, bytes); |
| net_dim(&q_vector->tx_dim, dim_sample); |
| |
| check_rx_itr: |
| if (!IDPF_ITR_IS_DYNAMIC(q_vector->rx_intr_mode)) |
| return; |
| |
| for (i = 0, packets = 0, bytes = 0; i < q_vector->num_rxq; i++) { |
| struct idpf_queue *rxq = q_vector->rx[i]; |
| unsigned int start; |
| |
| do { |
| start = u64_stats_fetch_begin(&rxq->stats_sync); |
| packets += u64_stats_read(&rxq->q_stats.rx.packets); |
| bytes += u64_stats_read(&rxq->q_stats.rx.bytes); |
| } while (u64_stats_fetch_retry(&rxq->stats_sync, start)); |
| } |
| |
| idpf_update_dim_sample(q_vector, &dim_sample, &q_vector->rx_dim, |
| packets, bytes); |
| net_dim(&q_vector->rx_dim, dim_sample); |
| } |
| |
| /** |
| * idpf_vport_intr_update_itr_ena_irq - Update itr and re-enable MSIX interrupt |
| * @q_vector: q_vector for which itr is being updated and interrupt enabled |
| * |
| * Update the net_dim() algorithm and re-enable the interrupt associated with |
| * this vector. |
| */ |
| void idpf_vport_intr_update_itr_ena_irq(struct idpf_q_vector *q_vector) |
| { |
| u32 intval; |
| |
| /* net_dim() updates ITR out-of-band using a work item */ |
| idpf_net_dim(q_vector); |
| |
| intval = idpf_vport_intr_buildreg_itr(q_vector, |
| IDPF_NO_ITR_UPDATE_IDX, 0); |
| |
| writel(intval, q_vector->intr_reg.dyn_ctl); |
| } |
| |
| /** |
| * idpf_vport_intr_req_irq - get MSI-X vectors from the OS for the vport |
| * @vport: main vport structure |
| * @basename: name for the vector |
| */ |
| static int idpf_vport_intr_req_irq(struct idpf_vport *vport, char *basename) |
| { |
| struct idpf_adapter *adapter = vport->adapter; |
| int vector, err, irq_num, vidx; |
| const char *vec_name; |
| |
| for (vector = 0; vector < vport->num_q_vectors; vector++) { |
| struct idpf_q_vector *q_vector = &vport->q_vectors[vector]; |
| |
| vidx = vport->q_vector_idxs[vector]; |
| irq_num = adapter->msix_entries[vidx].vector; |
| |
| if (q_vector->num_rxq && q_vector->num_txq) |
| vec_name = "TxRx"; |
| else if (q_vector->num_rxq) |
| vec_name = "Rx"; |
| else if (q_vector->num_txq) |
| vec_name = "Tx"; |
| else |
| continue; |
| |
| q_vector->name = kasprintf(GFP_KERNEL, "%s-%s-%d", |
| basename, vec_name, vidx); |
| |
| err = request_irq(irq_num, idpf_vport_intr_clean_queues, 0, |
| q_vector->name, q_vector); |
| if (err) { |
| netdev_err(vport->netdev, |
| "Request_irq failed, error: %d\n", err); |
| goto free_q_irqs; |
| } |
| /* assign the mask for this irq */ |
| irq_set_affinity_hint(irq_num, &q_vector->affinity_mask); |
| } |
| |
| return 0; |
| |
| free_q_irqs: |
| while (--vector >= 0) { |
| vidx = vport->q_vector_idxs[vector]; |
| irq_num = adapter->msix_entries[vidx].vector; |
| free_irq(irq_num, &vport->q_vectors[vector]); |
| } |
| |
| return err; |
| } |
| |
| /** |
| * idpf_vport_intr_write_itr - Write ITR value to the ITR register |
| * @q_vector: q_vector structure |
| * @itr: Interrupt throttling rate |
| * @tx: Tx or Rx ITR |
| */ |
| void idpf_vport_intr_write_itr(struct idpf_q_vector *q_vector, u16 itr, bool tx) |
| { |
| struct idpf_intr_reg *intr_reg; |
| |
| if (tx && !q_vector->tx) |
| return; |
| else if (!tx && !q_vector->rx) |
| return; |
| |
| intr_reg = &q_vector->intr_reg; |
| writel(ITR_REG_ALIGN(itr) >> IDPF_ITR_GRAN_S, |
| tx ? intr_reg->tx_itr : intr_reg->rx_itr); |
| } |
| |
| /** |
| * idpf_vport_intr_ena_irq_all - Enable IRQ for the given vport |
| * @vport: main vport structure |
| */ |
| static void idpf_vport_intr_ena_irq_all(struct idpf_vport *vport) |
| { |
| bool dynamic; |
| int q_idx; |
| u16 itr; |
| |
| for (q_idx = 0; q_idx < vport->num_q_vectors; q_idx++) { |
| struct idpf_q_vector *qv = &vport->q_vectors[q_idx]; |
| |
| /* Set the initial ITR values */ |
| if (qv->num_txq) { |
| dynamic = IDPF_ITR_IS_DYNAMIC(qv->tx_intr_mode); |
| itr = vport->tx_itr_profile[qv->tx_dim.profile_ix]; |
| idpf_vport_intr_write_itr(qv, dynamic ? |
| itr : qv->tx_itr_value, |
| true); |
| } |
| |
| if (qv->num_rxq) { |
| dynamic = IDPF_ITR_IS_DYNAMIC(qv->rx_intr_mode); |
| itr = vport->rx_itr_profile[qv->rx_dim.profile_ix]; |
| idpf_vport_intr_write_itr(qv, dynamic ? |
| itr : qv->rx_itr_value, |
| false); |
| } |
| |
| if (qv->num_txq || qv->num_rxq) |
| idpf_vport_intr_update_itr_ena_irq(qv); |
| } |
| } |
| |
| /** |
| * idpf_vport_intr_deinit - Release all vector associations for the vport |
| * @vport: main vport structure |
| */ |
| void idpf_vport_intr_deinit(struct idpf_vport *vport) |
| { |
| idpf_vport_intr_napi_dis_all(vport); |
| idpf_vport_intr_napi_del_all(vport); |
| idpf_vport_intr_dis_irq_all(vport); |
| idpf_vport_intr_rel_irq(vport); |
| } |
| |
| /** |
| * idpf_tx_dim_work - Call back from the stack |
| * @work: work queue structure |
| */ |
| static void idpf_tx_dim_work(struct work_struct *work) |
| { |
| struct idpf_q_vector *q_vector; |
| struct idpf_vport *vport; |
| struct dim *dim; |
| u16 itr; |
| |
| dim = container_of(work, struct dim, work); |
| q_vector = container_of(dim, struct idpf_q_vector, tx_dim); |
| vport = q_vector->vport; |
| |
| if (dim->profile_ix >= ARRAY_SIZE(vport->tx_itr_profile)) |
| dim->profile_ix = ARRAY_SIZE(vport->tx_itr_profile) - 1; |
| |
| /* look up the values in our local table */ |
| itr = vport->tx_itr_profile[dim->profile_ix]; |
| |
| idpf_vport_intr_write_itr(q_vector, itr, true); |
| |
| dim->state = DIM_START_MEASURE; |
| } |
| |
| /** |
| * idpf_rx_dim_work - Call back from the stack |
| * @work: work queue structure |
| */ |
| static void idpf_rx_dim_work(struct work_struct *work) |
| { |
| struct idpf_q_vector *q_vector; |
| struct idpf_vport *vport; |
| struct dim *dim; |
| u16 itr; |
| |
| dim = container_of(work, struct dim, work); |
| q_vector = container_of(dim, struct idpf_q_vector, rx_dim); |
| vport = q_vector->vport; |
| |
| if (dim->profile_ix >= ARRAY_SIZE(vport->rx_itr_profile)) |
| dim->profile_ix = ARRAY_SIZE(vport->rx_itr_profile) - 1; |
| |
| /* look up the values in our local table */ |
| itr = vport->rx_itr_profile[dim->profile_ix]; |
| |
| idpf_vport_intr_write_itr(q_vector, itr, false); |
| |
| dim->state = DIM_START_MEASURE; |
| } |
| |
| /** |
| * idpf_init_dim - Set up dynamic interrupt moderation |
| * @qv: q_vector structure |
| */ |
| static void idpf_init_dim(struct idpf_q_vector *qv) |
| { |
| INIT_WORK(&qv->tx_dim.work, idpf_tx_dim_work); |
| qv->tx_dim.mode = DIM_CQ_PERIOD_MODE_START_FROM_EQE; |
| qv->tx_dim.profile_ix = IDPF_DIM_DEFAULT_PROFILE_IX; |
| |
| INIT_WORK(&qv->rx_dim.work, idpf_rx_dim_work); |
| qv->rx_dim.mode = DIM_CQ_PERIOD_MODE_START_FROM_EQE; |
| qv->rx_dim.profile_ix = IDPF_DIM_DEFAULT_PROFILE_IX; |
| } |
| |
| /** |
| * idpf_vport_intr_napi_ena_all - Enable NAPI for all q_vectors in the vport |
| * @vport: main vport structure |
| */ |
| static void idpf_vport_intr_napi_ena_all(struct idpf_vport *vport) |
| { |
| int q_idx; |
| |
| for (q_idx = 0; q_idx < vport->num_q_vectors; q_idx++) { |
| struct idpf_q_vector *q_vector = &vport->q_vectors[q_idx]; |
| |
| idpf_init_dim(q_vector); |
| napi_enable(&q_vector->napi); |
| } |
| } |
| |
| /** |
| * idpf_tx_splitq_clean_all- Clean completion queues |
| * @q_vec: queue vector |
| * @budget: Used to determine if we are in netpoll |
| * @cleaned: returns number of packets cleaned |
| * |
| * Returns false if clean is not complete else returns true |
| */ |
| static bool idpf_tx_splitq_clean_all(struct idpf_q_vector *q_vec, |
| int budget, int *cleaned) |
| { |
| u16 num_txq = q_vec->num_txq; |
| bool clean_complete = true; |
| int i, budget_per_q; |
| |
| if (unlikely(!num_txq)) |
| return true; |
| |
| budget_per_q = DIV_ROUND_UP(budget, num_txq); |
| for (i = 0; i < num_txq; i++) |
| clean_complete &= idpf_tx_clean_complq(q_vec->tx[i], |
| budget_per_q, cleaned); |
| |
| return clean_complete; |
| } |
| |
| /** |
| * idpf_rx_splitq_clean_all- Clean completion queues |
| * @q_vec: queue vector |
| * @budget: Used to determine if we are in netpoll |
| * @cleaned: returns number of packets cleaned |
| * |
| * Returns false if clean is not complete else returns true |
| */ |
| static bool idpf_rx_splitq_clean_all(struct idpf_q_vector *q_vec, int budget, |
| int *cleaned) |
| { |
| u16 num_rxq = q_vec->num_rxq; |
| bool clean_complete = true; |
| int pkts_cleaned = 0; |
| int i, budget_per_q; |
| |
| /* We attempt to distribute budget to each Rx queue fairly, but don't |
| * allow the budget to go below 1 because that would exit polling early. |
| */ |
| budget_per_q = num_rxq ? max(budget / num_rxq, 1) : 0; |
| for (i = 0; i < num_rxq; i++) { |
| struct idpf_queue *rxq = q_vec->rx[i]; |
| int pkts_cleaned_per_q; |
| |
| pkts_cleaned_per_q = idpf_rx_splitq_clean(rxq, budget_per_q); |
| /* if we clean as many as budgeted, we must not be done */ |
| if (pkts_cleaned_per_q >= budget_per_q) |
| clean_complete = false; |
| pkts_cleaned += pkts_cleaned_per_q; |
| } |
| *cleaned = pkts_cleaned; |
| |
| for (i = 0; i < q_vec->num_bufq; i++) |
| idpf_rx_clean_refillq_all(q_vec->bufq[i]); |
| |
| return clean_complete; |
| } |
| |
| /** |
| * idpf_vport_splitq_napi_poll - NAPI handler |
| * @napi: struct from which you get q_vector |
| * @budget: budget provided by stack |
| */ |
| static int idpf_vport_splitq_napi_poll(struct napi_struct *napi, int budget) |
| { |
| struct idpf_q_vector *q_vector = |
| container_of(napi, struct idpf_q_vector, napi); |
| bool clean_complete; |
| int work_done = 0; |
| |
| /* Handle case where we are called by netpoll with a budget of 0 */ |
| if (unlikely(!budget)) { |
| idpf_tx_splitq_clean_all(q_vector, budget, &work_done); |
| |
| return 0; |
| } |
| |
| clean_complete = idpf_rx_splitq_clean_all(q_vector, budget, &work_done); |
| clean_complete &= idpf_tx_splitq_clean_all(q_vector, budget, &work_done); |
| |
| /* If work not completed, return budget and polling will return */ |
| if (!clean_complete) |
| return budget; |
| |
| work_done = min_t(int, work_done, budget - 1); |
| |
| /* Exit the polling mode, but don't re-enable interrupts if stack might |
| * poll us due to busy-polling |
| */ |
| if (likely(napi_complete_done(napi, work_done))) |
| idpf_vport_intr_update_itr_ena_irq(q_vector); |
| |
| /* Switch to poll mode in the tear-down path after sending disable |
| * queues virtchnl message, as the interrupts will be disabled after |
| * that |
| */ |
| if (unlikely(q_vector->num_txq && test_bit(__IDPF_Q_POLL_MODE, |
| q_vector->tx[0]->flags))) |
| return budget; |
| else |
| return work_done; |
| } |
| |
| /** |
| * idpf_vport_intr_map_vector_to_qs - Map vectors to queues |
| * @vport: virtual port |
| * |
| * Mapping for vectors to queues |
| */ |
| static void idpf_vport_intr_map_vector_to_qs(struct idpf_vport *vport) |
| { |
| u16 num_txq_grp = vport->num_txq_grp; |
| int i, j, qv_idx, bufq_vidx = 0; |
| struct idpf_rxq_group *rx_qgrp; |
| struct idpf_txq_group *tx_qgrp; |
| struct idpf_queue *q, *bufq; |
| u16 q_index; |
| |
| for (i = 0, qv_idx = 0; i < vport->num_rxq_grp; i++) { |
| u16 num_rxq; |
| |
| rx_qgrp = &vport->rxq_grps[i]; |
| if (idpf_is_queue_model_split(vport->rxq_model)) |
| num_rxq = rx_qgrp->splitq.num_rxq_sets; |
| else |
| num_rxq = rx_qgrp->singleq.num_rxq; |
| |
| for (j = 0; j < num_rxq; j++) { |
| if (qv_idx >= vport->num_q_vectors) |
| qv_idx = 0; |
| |
| if (idpf_is_queue_model_split(vport->rxq_model)) |
| q = &rx_qgrp->splitq.rxq_sets[j]->rxq; |
| else |
| q = rx_qgrp->singleq.rxqs[j]; |
| q->q_vector = &vport->q_vectors[qv_idx]; |
| q_index = q->q_vector->num_rxq; |
| q->q_vector->rx[q_index] = q; |
| q->q_vector->num_rxq++; |
| qv_idx++; |
| } |
| |
| if (idpf_is_queue_model_split(vport->rxq_model)) { |
| for (j = 0; j < vport->num_bufqs_per_qgrp; j++) { |
| bufq = &rx_qgrp->splitq.bufq_sets[j].bufq; |
| bufq->q_vector = &vport->q_vectors[bufq_vidx]; |
| q_index = bufq->q_vector->num_bufq; |
| bufq->q_vector->bufq[q_index] = bufq; |
| bufq->q_vector->num_bufq++; |
| } |
| if (++bufq_vidx >= vport->num_q_vectors) |
| bufq_vidx = 0; |
| } |
| } |
| |
| for (i = 0, qv_idx = 0; i < num_txq_grp; i++) { |
| u16 num_txq; |
| |
| tx_qgrp = &vport->txq_grps[i]; |
| num_txq = tx_qgrp->num_txq; |
| |
| if (idpf_is_queue_model_split(vport->txq_model)) { |
| if (qv_idx >= vport->num_q_vectors) |
| qv_idx = 0; |
| |
| q = tx_qgrp->complq; |
| q->q_vector = &vport->q_vectors[qv_idx]; |
| q_index = q->q_vector->num_txq; |
| q->q_vector->tx[q_index] = q; |
| q->q_vector->num_txq++; |
| qv_idx++; |
| } else { |
| for (j = 0; j < num_txq; j++) { |
| if (qv_idx >= vport->num_q_vectors) |
| qv_idx = 0; |
| |
| q = tx_qgrp->txqs[j]; |
| q->q_vector = &vport->q_vectors[qv_idx]; |
| q_index = q->q_vector->num_txq; |
| q->q_vector->tx[q_index] = q; |
| q->q_vector->num_txq++; |
| |
| qv_idx++; |
| } |
| } |
| } |
| } |
| |
| /** |
| * idpf_vport_intr_init_vec_idx - Initialize the vector indexes |
| * @vport: virtual port |
| * |
| * Initialize vector indexes with values returened over mailbox |
| */ |
| static int idpf_vport_intr_init_vec_idx(struct idpf_vport *vport) |
| { |
| struct idpf_adapter *adapter = vport->adapter; |
| struct virtchnl2_alloc_vectors *ac; |
| u16 *vecids, total_vecs; |
| int i; |
| |
| ac = adapter->req_vec_chunks; |
| if (!ac) { |
| for (i = 0; i < vport->num_q_vectors; i++) |
| vport->q_vectors[i].v_idx = vport->q_vector_idxs[i]; |
| |
| return 0; |
| } |
| |
| total_vecs = idpf_get_reserved_vecs(adapter); |
| vecids = kcalloc(total_vecs, sizeof(u16), GFP_KERNEL); |
| if (!vecids) |
| return -ENOMEM; |
| |
| idpf_get_vec_ids(adapter, vecids, total_vecs, &ac->vchunks); |
| |
| for (i = 0; i < vport->num_q_vectors; i++) |
| vport->q_vectors[i].v_idx = vecids[vport->q_vector_idxs[i]]; |
| |
| kfree(vecids); |
| |
| return 0; |
| } |
| |
| /** |
| * idpf_vport_intr_napi_add_all- Register napi handler for all qvectors |
| * @vport: virtual port structure |
| */ |
| static void idpf_vport_intr_napi_add_all(struct idpf_vport *vport) |
| { |
| int (*napi_poll)(struct napi_struct *napi, int budget); |
| u16 v_idx; |
| |
| if (idpf_is_queue_model_split(vport->txq_model)) |
| napi_poll = idpf_vport_splitq_napi_poll; |
| else |
| napi_poll = idpf_vport_singleq_napi_poll; |
| |
| for (v_idx = 0; v_idx < vport->num_q_vectors; v_idx++) { |
| struct idpf_q_vector *q_vector = &vport->q_vectors[v_idx]; |
| |
| netif_napi_add(vport->netdev, &q_vector->napi, napi_poll); |
| |
| /* only set affinity_mask if the CPU is online */ |
| if (cpu_online(v_idx)) |
| cpumask_set_cpu(v_idx, &q_vector->affinity_mask); |
| } |
| } |
| |
| /** |
| * idpf_vport_intr_alloc - Allocate memory for interrupt vectors |
| * @vport: virtual port |
| * |
| * We allocate one q_vector per queue interrupt. If allocation fails we |
| * return -ENOMEM. |
| */ |
| int idpf_vport_intr_alloc(struct idpf_vport *vport) |
| { |
| u16 txqs_per_vector, rxqs_per_vector, bufqs_per_vector; |
| struct idpf_q_vector *q_vector; |
| int v_idx, err; |
| |
| vport->q_vectors = kcalloc(vport->num_q_vectors, |
| sizeof(struct idpf_q_vector), GFP_KERNEL); |
| if (!vport->q_vectors) |
| return -ENOMEM; |
| |
| txqs_per_vector = DIV_ROUND_UP(vport->num_txq, vport->num_q_vectors); |
| rxqs_per_vector = DIV_ROUND_UP(vport->num_rxq, vport->num_q_vectors); |
| bufqs_per_vector = vport->num_bufqs_per_qgrp * |
| DIV_ROUND_UP(vport->num_rxq_grp, |
| vport->num_q_vectors); |
| |
| for (v_idx = 0; v_idx < vport->num_q_vectors; v_idx++) { |
| q_vector = &vport->q_vectors[v_idx]; |
| q_vector->vport = vport; |
| |
| q_vector->tx_itr_value = IDPF_ITR_TX_DEF; |
| q_vector->tx_intr_mode = IDPF_ITR_DYNAMIC; |
| q_vector->tx_itr_idx = VIRTCHNL2_ITR_IDX_1; |
| |
| q_vector->rx_itr_value = IDPF_ITR_RX_DEF; |
| q_vector->rx_intr_mode = IDPF_ITR_DYNAMIC; |
| q_vector->rx_itr_idx = VIRTCHNL2_ITR_IDX_0; |
| |
| q_vector->tx = kcalloc(txqs_per_vector, |
| sizeof(struct idpf_queue *), |
| GFP_KERNEL); |
| if (!q_vector->tx) { |
| err = -ENOMEM; |
| goto error; |
| } |
| |
| q_vector->rx = kcalloc(rxqs_per_vector, |
| sizeof(struct idpf_queue *), |
| GFP_KERNEL); |
| if (!q_vector->rx) { |
| err = -ENOMEM; |
| goto error; |
| } |
| |
| if (!idpf_is_queue_model_split(vport->rxq_model)) |
| continue; |
| |
| q_vector->bufq = kcalloc(bufqs_per_vector, |
| sizeof(struct idpf_queue *), |
| GFP_KERNEL); |
| if (!q_vector->bufq) { |
| err = -ENOMEM; |
| goto error; |
| } |
| } |
| |
| return 0; |
| |
| error: |
| idpf_vport_intr_rel(vport); |
| |
| return err; |
| } |
| |
| /** |
| * idpf_vport_intr_init - Setup all vectors for the given vport |
| * @vport: virtual port |
| * |
| * Returns 0 on success or negative on failure |
| */ |
| int idpf_vport_intr_init(struct idpf_vport *vport) |
| { |
| char *int_name; |
| int err; |
| |
| err = idpf_vport_intr_init_vec_idx(vport); |
| if (err) |
| return err; |
| |
| idpf_vport_intr_map_vector_to_qs(vport); |
| idpf_vport_intr_napi_add_all(vport); |
| idpf_vport_intr_napi_ena_all(vport); |
| |
| err = vport->adapter->dev_ops.reg_ops.intr_reg_init(vport); |
| if (err) |
| goto unroll_vectors_alloc; |
| |
| int_name = kasprintf(GFP_KERNEL, "%s-%s", |
| dev_driver_string(&vport->adapter->pdev->dev), |
| vport->netdev->name); |
| |
| err = idpf_vport_intr_req_irq(vport, int_name); |
| if (err) |
| goto unroll_vectors_alloc; |
| |
| idpf_vport_intr_ena_irq_all(vport); |
| |
| return 0; |
| |
| unroll_vectors_alloc: |
| idpf_vport_intr_napi_dis_all(vport); |
| idpf_vport_intr_napi_del_all(vport); |
| |
| return err; |
| } |
| |
| /** |
| * idpf_config_rss - Send virtchnl messages to configure RSS |
| * @vport: virtual port |
| * |
| * Return 0 on success, negative on failure |
| */ |
| int idpf_config_rss(struct idpf_vport *vport) |
| { |
| int err; |
| |
| err = idpf_send_get_set_rss_key_msg(vport, false); |
| if (err) |
| return err; |
| |
| return idpf_send_get_set_rss_lut_msg(vport, false); |
| } |
| |
| /** |
| * idpf_fill_dflt_rss_lut - Fill the indirection table with the default values |
| * @vport: virtual port structure |
| */ |
| static void idpf_fill_dflt_rss_lut(struct idpf_vport *vport) |
| { |
| struct idpf_adapter *adapter = vport->adapter; |
| u16 num_active_rxq = vport->num_rxq; |
| struct idpf_rss_data *rss_data; |
| int i; |
| |
| rss_data = &adapter->vport_config[vport->idx]->user_config.rss_data; |
| |
| for (i = 0; i < rss_data->rss_lut_size; i++) { |
| rss_data->rss_lut[i] = i % num_active_rxq; |
| rss_data->cached_lut[i] = rss_data->rss_lut[i]; |
| } |
| } |
| |
| /** |
| * idpf_init_rss - Allocate and initialize RSS resources |
| * @vport: virtual port |
| * |
| * Return 0 on success, negative on failure |
| */ |
| int idpf_init_rss(struct idpf_vport *vport) |
| { |
| struct idpf_adapter *adapter = vport->adapter; |
| struct idpf_rss_data *rss_data; |
| u32 lut_size; |
| |
| rss_data = &adapter->vport_config[vport->idx]->user_config.rss_data; |
| |
| lut_size = rss_data->rss_lut_size * sizeof(u32); |
| rss_data->rss_lut = kzalloc(lut_size, GFP_KERNEL); |
| if (!rss_data->rss_lut) |
| return -ENOMEM; |
| |
| rss_data->cached_lut = kzalloc(lut_size, GFP_KERNEL); |
| if (!rss_data->cached_lut) { |
| kfree(rss_data->rss_lut); |
| rss_data->rss_lut = NULL; |
| |
| return -ENOMEM; |
| } |
| |
| /* Fill the default RSS lut values */ |
| idpf_fill_dflt_rss_lut(vport); |
| |
| return idpf_config_rss(vport); |
| } |
| |
| /** |
| * idpf_deinit_rss - Release RSS resources |
| * @vport: virtual port |
| */ |
| void idpf_deinit_rss(struct idpf_vport *vport) |
| { |
| struct idpf_adapter *adapter = vport->adapter; |
| struct idpf_rss_data *rss_data; |
| |
| rss_data = &adapter->vport_config[vport->idx]->user_config.rss_data; |
| kfree(rss_data->cached_lut); |
| rss_data->cached_lut = NULL; |
| kfree(rss_data->rss_lut); |
| rss_data->rss_lut = NULL; |
| } |