From: Dawid Gorecki <d...@semihalf.com>

Add support for RTE_ETH_TX_OFFLOAD_MBUF_FAST_FREE offload. It can be
enabled if all the mbufs for a given queue belong to the same mempool
and their reference count is equal to 1.

Signed-off-by: Dawid Gorecki <d...@semihalf.com>
Reviewed-by: Michal Krawczyk <m...@semihalf.com>
Reviewed-by: Shai Brandes <shaib...@amazon.com>
Reviewed-by: Amit Bernstein <amitb...@amazon.com>
---
 doc/guides/nics/features/ena.ini       |  1 +
 doc/guides/rel_notes/release_22_07.rst |  7 ++++
 drivers/net/ena/ena_ethdev.c           | 49 ++++++++++++++++++++++++--
 3 files changed, 55 insertions(+), 2 deletions(-)

diff --git a/doc/guides/nics/features/ena.ini b/doc/guides/nics/features/ena.ini
index 59c1ae85fa..1fe7a71e3d 100644
--- a/doc/guides/nics/features/ena.ini
+++ b/doc/guides/nics/features/ena.ini
@@ -7,6 +7,7 @@
 Link status          = Y
 Link status event    = Y
 Rx interrupt         = Y
+Fast mbuf free       = Y
 Free Tx mbuf on demand = Y
 MTU update           = Y
 Scattered Rx         = Y
diff --git a/doc/guides/rel_notes/release_22_07.rst 
b/doc/guides/rel_notes/release_22_07.rst
index d46f773df0..73f566e5fc 100644
--- a/doc/guides/rel_notes/release_22_07.rst
+++ b/doc/guides/rel_notes/release_22_07.rst
@@ -87,6 +87,13 @@ New Features
 
   Added an API which can get the device type of vDPA device.
 
+
+* **Updated Amazon ena driver.**
+
+  The new driver version (v2.7.0) includes:
+
+  * Added fast mbuf free feature support.
+
 * **Updated Intel iavf driver.**
 
   * Added Tx QoS queue rate limitation support.
diff --git a/drivers/net/ena/ena_ethdev.c b/drivers/net/ena/ena_ethdev.c
index 68768cab70..68a4478410 100644
--- a/drivers/net/ena/ena_ethdev.c
+++ b/drivers/net/ena/ena_ethdev.c
@@ -36,6 +36,12 @@
 
 #define ENA_MIN_RING_DESC      128
 
+/*
+ * We should try to keep ENA_CLEANUP_BUF_SIZE lower than
+ * RTE_MEMPOOL_CACHE_MAX_SIZE, so we can fit this in mempool local cache.
+ */
+#define ENA_CLEANUP_BUF_SIZE   256
+
 #define ENA_PTYPE_HAS_HASH     (RTE_PTYPE_L4_TCP | RTE_PTYPE_L4_UDP)
 
 struct ena_stats {
@@ -2402,6 +2408,8 @@ static uint64_t ena_get_tx_port_offloads(struct 
ena_adapter *adapter)
 
        port_offloads |= RTE_ETH_TX_OFFLOAD_MULTI_SEGS;
 
+       port_offloads |= RTE_ETH_TX_OFFLOAD_MBUF_FAST_FREE;
+
        return port_offloads;
 }
 
@@ -2414,9 +2422,12 @@ static uint64_t ena_get_rx_queue_offloads(struct 
ena_adapter *adapter)
 
 static uint64_t ena_get_tx_queue_offloads(struct ena_adapter *adapter)
 {
+       uint64_t queue_offloads = 0;
        RTE_SET_USED(adapter);
 
-       return 0;
+       queue_offloads |= RTE_ETH_TX_OFFLOAD_MBUF_FAST_FREE;
+
+       return queue_offloads;
 }
 
 static int ena_infos_get(struct rte_eth_dev *dev,
@@ -3001,13 +3012,38 @@ static int ena_xmit_mbuf(struct ena_ring *tx_ring, 
struct rte_mbuf *mbuf)
        return 0;
 }
 
+static __rte_always_inline size_t
+ena_tx_cleanup_mbuf_fast(struct rte_mbuf **mbufs_to_clean,
+                        struct rte_mbuf *mbuf,
+                        size_t mbuf_cnt,
+                        size_t buf_size)
+{
+       struct rte_mbuf *m_next;
+
+       while (mbuf != NULL) {
+               m_next = mbuf->next;
+               mbufs_to_clean[mbuf_cnt++] = mbuf;
+               if (mbuf_cnt == buf_size) {
+                       rte_mempool_put_bulk(mbufs_to_clean[0]->pool, (void 
**)mbufs_to_clean,
+                               (unsigned int)mbuf_cnt);
+                       mbuf_cnt = 0;
+               }
+               mbuf = m_next;
+       }
+
+       return mbuf_cnt;
+}
+
 static int ena_tx_cleanup(void *txp, uint32_t free_pkt_cnt)
 {
+       struct rte_mbuf *mbufs_to_clean[ENA_CLEANUP_BUF_SIZE];
        struct ena_ring *tx_ring = (struct ena_ring *)txp;
+       size_t mbuf_cnt = 0;
        unsigned int total_tx_descs = 0;
        unsigned int total_tx_pkts = 0;
        uint16_t cleanup_budget;
        uint16_t next_to_clean = tx_ring->next_to_clean;
+       bool fast_free = tx_ring->offloads & RTE_ETH_TX_OFFLOAD_MBUF_FAST_FREE;
 
        /*
         * If free_pkt_cnt is equal to 0, it means that the user requested
@@ -3032,7 +3068,12 @@ static int ena_tx_cleanup(void *txp, uint32_t 
free_pkt_cnt)
                tx_info->timestamp = 0;
 
                mbuf = tx_info->mbuf;
-               rte_pktmbuf_free(mbuf);
+               if (fast_free) {
+                       mbuf_cnt = ena_tx_cleanup_mbuf_fast(mbufs_to_clean, 
mbuf, mbuf_cnt,
+                               ENA_CLEANUP_BUF_SIZE);
+               } else {
+                       rte_pktmbuf_free(mbuf);
+               }
 
                tx_info->mbuf = NULL;
                tx_ring->empty_tx_reqs[next_to_clean] = req_id;
@@ -3052,6 +3093,10 @@ static int ena_tx_cleanup(void *txp, uint32_t 
free_pkt_cnt)
                ena_com_update_dev_comp_head(tx_ring->ena_com_io_cq);
        }
 
+       if (mbuf_cnt != 0)
+               rte_mempool_put_bulk(mbufs_to_clean[0]->pool,
+                       (void **)mbufs_to_clean, mbuf_cnt);
+
        /* Notify completion handler that full cleanup was performed */
        if (free_pkt_cnt == 0 || total_tx_pkts < cleanup_budget)
                tx_ring->last_cleanup_ticks = rte_get_timer_cycles();
-- 
2.25.1

Reply via email to