Add support in the i40e driver for the rte_eth_tx_done_cleanup() API,
which forces consumed buffers on the Tx ring to be freed.

Signed-off-by: Chenxu Di <chenxux...@intel.com>
---
 drivers/net/i40e/i40e_ethdev.c    |   3 +
 drivers/net/i40e/i40e_ethdev_vf.c |   3 +
 drivers/net/i40e/i40e_rxtx.c      | 151 ++++++++++++++++++++++++++++++
 drivers/net/i40e/i40e_rxtx.h      |   8 ++
 4 files changed, 165 insertions(+)

diff --git a/drivers/net/i40e/i40e_ethdev.c b/drivers/net/i40e/i40e_ethdev.c
index 5999c964b..e0b071891 100644
--- a/drivers/net/i40e/i40e_ethdev.c
+++ b/drivers/net/i40e/i40e_ethdev.c
@@ -522,6 +522,7 @@ static const struct eth_dev_ops i40e_eth_dev_ops = {
        .mac_addr_set                 = i40e_set_default_mac_addr,
        .mtu_set                      = i40e_dev_mtu_set,
        .tm_ops_get                   = i40e_tm_ops_get,
+       .tx_done_cleanup              = i40e_tx_done_cleanup,
 };
 
 /* store statistics names and its offset in stats structure */
@@ -1358,6 +1359,8 @@ eth_i40e_dev_init(struct rte_eth_dev *dev, void *init_params __rte_unused)
        dev->tx_pkt_burst = i40e_xmit_pkts;
        dev->tx_pkt_prepare = i40e_prep_pkts;
 
+       i40e_set_tx_done_cleanup_func(i40e_tx_done_cleanup_scalar);
+
        /* for secondary processes, we don't initialise any further as primary
         * has already done this work. Only check we don't need a different
         * RX function */
diff --git a/drivers/net/i40e/i40e_ethdev_vf.c b/drivers/net/i40e/i40e_ethdev_vf.c
index 5dba0928b..3dcc9434c 100644
--- a/drivers/net/i40e/i40e_ethdev_vf.c
+++ b/drivers/net/i40e/i40e_ethdev_vf.c
@@ -215,6 +215,7 @@ static const struct eth_dev_ops i40evf_eth_dev_ops = {
        .rss_hash_conf_get    = i40evf_dev_rss_hash_conf_get,
        .mtu_set              = i40evf_dev_mtu_set,
        .mac_addr_set         = i40evf_set_default_mac_addr,
+       .tx_done_cleanup      = i40e_tx_done_cleanup,
 };
 
 /*
@@ -1473,6 +1474,8 @@ i40evf_dev_init(struct rte_eth_dev *eth_dev)
        eth_dev->rx_pkt_burst = &i40e_recv_pkts;
        eth_dev->tx_pkt_burst = &i40e_xmit_pkts;
 
+       i40e_set_tx_done_cleanup_func(i40e_tx_done_cleanup_scalar);
+
        /*
         * For secondary processes, we don't initialise any further as primary
         * has already done this work.
diff --git a/drivers/net/i40e/i40e_rxtx.c b/drivers/net/i40e/i40e_rxtx.c
index 17dc8c78f..dfbca06b6 100644
--- a/drivers/net/i40e/i40e_rxtx.c
+++ b/drivers/net/i40e/i40e_rxtx.c
@@ -2455,6 +2455,154 @@ i40e_tx_queue_release_mbufs(struct i40e_tx_queue *txq)
        }
 }
 
+static i40e_tx_done_cleanup_t i40e_tx_done_cleanup_op; /* NULL until set */
+/*
+ * Tx cleanup handler registered together with the i40e_xmit_pkts burst
+ * function.
+ *
+ * Walks txq->sw_ring starting at the entry that follows tx_tail, frees
+ * every mbuf segment it finds with rte_pktmbuf_free_seg() and counts one
+ * packet each time the freed entry is the last one of its packet
+ * (last_id equals the entry's own index).
+ *
+ * txq:      Tx queue to clean.
+ * free_cnt: number of packets to free; 0 is replaced by txq->nb_tx_desc.
+ *
+ * Returns the number of packets freed. Returns 0 straight away when the
+ * queue has no free descriptor and i40e_xmit_cleanup() returns non-zero.
+ */
+int
+i40e_tx_done_cleanup_scalar(struct i40e_tx_queue *txq,
+                       uint32_t free_cnt)
+{
+       uint32_t pkt_cnt;
+       uint16_t i;
+       uint16_t tx_last;
+       uint16_t tx_id;
+       uint16_t nb_tx_to_clean;
+       uint16_t nb_tx_free_last;
+       struct i40e_tx_entry *swr_ring = txq->sw_ring;
+
+       /* Start free mbuf from the next of tx_tail; tx_last marks the point
+        * at which the walk has gone once around the ring.
+        */
+       tx_last = txq->tx_tail;
+       tx_id  = swr_ring[tx_last].next_id;
+
+       if (txq->nb_tx_free == 0)
+               if (i40e_xmit_cleanup(txq))
+                       return 0;
+
+       nb_tx_to_clean = txq->nb_tx_free;
+       nb_tx_free_last = txq->nb_tx_free;
+       if (!free_cnt)
+               free_cnt = txq->nb_tx_desc;
+
+       /* Loop through swr_ring to count the amount of
+        * freeable mbufs and packets.
+        * Each pass visits at most nb_tx_to_clean entries and stops early
+        * once free_cnt packets were freed or the walk is back at tx_last.
+        */
+       for (pkt_cnt = 0; pkt_cnt < free_cnt; ) {
+               for (i = 0; i < nb_tx_to_clean &&
+                       pkt_cnt < free_cnt &&
+                       tx_id != tx_last; i++) {
+                       if (swr_ring[tx_id].mbuf != NULL) {
+                               rte_pktmbuf_free_seg(swr_ring[tx_id].mbuf);
+                               swr_ring[tx_id].mbuf = NULL;
+
+                               /*
+                                * last segment in the packet,
+                                * increment packet count
+                                */
+                               pkt_cnt += (swr_ring[tx_id].last_id == tx_id);
+                       }
+
+                       tx_id = swr_ring[tx_id].next_id;
+               }
+               /* Stop once the whole ring was walked or fewer than
+                * tx_rs_thresh descriptors are still not free.
+                */
+               if (tx_id == tx_last || txq->tx_rs_thresh
+                       > txq->nb_tx_desc - txq->nb_tx_free)
+                       break;
+
+               if (pkt_cnt < free_cnt) {
+                       if (i40e_xmit_cleanup(txq))
+                               break;
+                       /* next pass: newly freed descriptors only */
+                       nb_tx_to_clean = txq->nb_tx_free - nb_tx_free_last;
+                       nb_tx_free_last = txq->nb_tx_free;
+               }
+       }
+
+       PMD_TX_FREE_LOG(DEBUG,
+               "Free %u Packets successfully "
+               "(port=%d queue=%d)",
+               pkt_cnt, txq->port_id, txq->queue_id);
+
+       return (int)pkt_cnt;
+}
+
+/*
+ * Tx cleanup handler registered together with the i40e_xmit_pkts_simple
+ * burst function.
+ *
+ * Buffers are released in whole batches, one batch per successful call
+ * to i40e_tx_free_bufs(), and every buffer is counted as one packet.
+ * NOTE(review): i40e_tx_free_bufs() is defined outside this patch; it is
+ * assumed to release txq->tx_rs_thresh single-segment buffers and to
+ * return non-zero when it did so - confirm.
+ *
+ * txq:      Tx queue to clean.
+ * free_cnt: maximum number of packets to free; 0 is replaced by
+ *           txq->nb_tx_desc. Because freeing is batch-granular, a
+ *           request smaller than tx_rs_thresh frees nothing.
+ *
+ * Returns the number of packets freed, always a multiple of
+ * tx_rs_thresh and never more than free_cnt.
+ */
+int
+i40e_tx_done_cleanup_simple(struct i40e_tx_queue *txq,
+                       uint32_t free_cnt)
+{
+       const uint16_t batch = txq->tx_rs_thresh;
+       uint32_t pkt_cnt = 0;
+
+       /* Defensive: a zero batch size could never make progress. */
+       if (batch == 0)
+               return 0;
+
+       /* while free_cnt is 0,
+        * suppose one mbuf per packet,
+        * try to free packets as many as possible
+        */
+       if (free_cnt == 0)
+               free_cnt = txq->nb_tx_desc;
+
+       /* Free whole batches for as long as one more still fits into the
+        * request. pkt_cnt never exceeds free_cnt, so the subtraction
+        * cannot wrap.
+        */
+       while (free_cnt - pkt_cnt >= batch) {
+               /* Fewer than one batch of descriptors is outstanding. */
+               if (txq->nb_tx_desc - txq->nb_tx_free < batch)
+                       break;
+
+               if (!i40e_tx_free_bufs(txq))
+                       break;
+
+               pkt_cnt += batch;
+       }
+
+       PMD_TX_FREE_LOG(DEBUG,
+               "Free %u packets successfully "
+               "(port=%d queue=%d)",
+               pkt_cnt, txq->port_id, txq->queue_id);
+
+       return (int)pkt_cnt;
+}
+/*
+ * Tx cleanup handler registered by i40e_set_tx_function() when it picks
+ * a vector Tx burst function. Both arguments are ignored and the call
+ * always fails with -ENOTSUP.
+ */
+int
+i40e_tx_done_cleanup_vec(struct i40e_tx_queue *txq __rte_unused,
+                       uint32_t free_cnt __rte_unused)
+{
+       return -ENOTSUP;
+}
+
+/*
+ * tx_done_cleanup callback of the i40e PF and VF eth_dev_ops tables.
+ *
+ * Forwards txq and free_cnt to the handler currently returned by
+ * i40e_get_tx_done_cleanup_func() and passes its result back unchanged.
+ * Returns -ENOTSUP when no handler has been registered.
+ */
+int
+i40e_tx_done_cleanup(void *txq, uint32_t free_cnt)
+{
+       i40e_tx_done_cleanup_t handler = i40e_get_tx_done_cleanup_func();
+
+       if (handler != NULL)
+               return handler(txq, free_cnt);
+
+       return -ENOTSUP;
+}
+/*
+ * Register fn as the handler that i40e_tx_done_cleanup() dispatches to.
+ *
+ * NOTE(review): the handler lives in a single file-scope variable, so the
+ * most recent call wins for every queue, while i40e_set_tx_function()
+ * selects it per rte_eth_dev - confirm this is intended when several
+ * ports use different Tx paths.
+ */
+void
+i40e_set_tx_done_cleanup_func(i40e_tx_done_cleanup_t fn)
+{
+       i40e_tx_done_cleanup_op = fn;
+}
+/*
+ * Return the handler last stored by i40e_set_tx_done_cleanup_func(), or
+ * NULL when none has been stored yet (the variable has static storage).
+ */
+i40e_tx_done_cleanup_t
+i40e_get_tx_done_cleanup_func(void)
+{
+       return i40e_tx_done_cleanup_op;
+}
+
 void
 i40e_reset_tx_queue(struct i40e_tx_queue *txq)
 {
@@ -3139,15 +3287,18 @@ i40e_set_tx_function(struct rte_eth_dev *dev)
                        else
                                dev->tx_pkt_burst =
                                        i40e_get_recommend_tx_vec();
+                       i40e_set_tx_done_cleanup_func(i40e_tx_done_cleanup_vec);
                } else {
                        PMD_INIT_LOG(DEBUG, "Simple tx finally be used.");
                        dev->tx_pkt_burst = i40e_xmit_pkts_simple;
+                       i40e_set_tx_done_cleanup_func(i40e_tx_done_cleanup_simple);
                }
                dev->tx_pkt_prepare = NULL;
        } else {
                PMD_INIT_LOG(DEBUG, "Xmit tx finally be used.");
                dev->tx_pkt_burst = i40e_xmit_pkts;
                dev->tx_pkt_prepare = i40e_prep_pkts;
+               i40e_set_tx_done_cleanup_func(i40e_tx_done_cleanup_scalar);
        }
 }
 
diff --git a/drivers/net/i40e/i40e_rxtx.h b/drivers/net/i40e/i40e_rxtx.h
index 2106bb355..ab2c0ffd0 100644
--- a/drivers/net/i40e/i40e_rxtx.h
+++ b/drivers/net/i40e/i40e_rxtx.h
@@ -173,6 +173,8 @@ union i40e_tx_offload {
                uint64_t outer_l3_len:16; /**< outer L3 Header Length */
        };
 };
+typedef int (*i40e_tx_done_cleanup_t)(struct i40e_tx_queue *txq,
+                               uint32_t free_cnt); /**< Tx cleanup handler */
 
 int i40e_dev_rx_queue_start(struct rte_eth_dev *dev, uint16_t rx_queue_id);
 int i40e_dev_rx_queue_stop(struct rte_eth_dev *dev, uint16_t rx_queue_id);
@@ -212,6 +214,12 @@ void i40e_dev_free_queues(struct rte_eth_dev *dev);
 void i40e_reset_rx_queue(struct i40e_rx_queue *rxq);
 void i40e_reset_tx_queue(struct i40e_tx_queue *txq);
 void i40e_tx_queue_release_mbufs(struct i40e_tx_queue *txq);
+void i40e_set_tx_done_cleanup_func(i40e_tx_done_cleanup_t fn);
+i40e_tx_done_cleanup_t i40e_get_tx_done_cleanup_func(void);
+int i40e_tx_done_cleanup(void *txq, uint32_t free_cnt);
+int i40e_tx_done_cleanup_scalar(struct i40e_tx_queue *txq, uint32_t free_cnt);
+int i40e_tx_done_cleanup_vec(struct i40e_tx_queue *txq, uint32_t free_cnt);
+int i40e_tx_done_cleanup_simple(struct i40e_tx_queue *txq, uint32_t free_cnt);
 int i40e_alloc_rx_queue_mbufs(struct i40e_rx_queue *rxq);
 void i40e_rx_queue_release_mbufs(struct i40e_rx_queue *rxq);
 
-- 
2.17.1

Reply via email to