From: Moti Haimovsky <mo...@mellanox.com>

This patch adds Tx loopback support, used when the device is a virtual
function (VF), to enable packet transmission between VFs and the PF.

Signed-off-by: Moti Haimovsky <mo...@mellanox.com>
Acked-by: Adrien Mazarguil <adrien.mazarg...@6wind.com>
---
 drivers/net/mlx4/mlx4_rxtx.c | 33 +++++++++++++++++++++------------
 drivers/net/mlx4/mlx4_rxtx.h |  1 +
 drivers/net/mlx4/mlx4_txq.c  |  2 ++
 3 files changed, 24 insertions(+), 12 deletions(-)

diff --git a/drivers/net/mlx4/mlx4_rxtx.c b/drivers/net/mlx4/mlx4_rxtx.c
index 87c5261..36173ad 100644
--- a/drivers/net/mlx4/mlx4_rxtx.c
+++ b/drivers/net/mlx4/mlx4_rxtx.c
@@ -311,10 +311,13 @@ struct pv {
        struct mlx4_wqe_data_seg *dseg;
        struct mlx4_sq *sq = &txq->msq;
        struct rte_mbuf *buf;
+       union {
+               uint32_t flags;
+               uint16_t flags16[2];
+       } srcrb;
        uint32_t head_idx = sq->head & sq->txbb_cnt_mask;
        uint32_t lkey;
        uintptr_t addr;
-       uint32_t srcrb_flags;
        uint32_t owner_opcode = MLX4_OPCODE_SEND;
        uint32_t byte_count;
        int wqe_real_size;
@@ -414,22 +417,16 @@ struct pv {
        /* Fill the control parameters for this packet. */
        ctrl->fence_size = (wqe_real_size >> 4) & 0x3f;
        /*
-        * The caller should prepare "imm" in advance in order to support
-        * VF to VF communication (when the device is a virtual-function
-        * device (VF)).
-        */
-       ctrl->imm = 0;
-       /*
         * For raw Ethernet, the SOLICIT flag is used to indicate that no ICRC
         * should be calculated.
         */
        txq->elts_comp_cd -= nr_txbbs;
        if (unlikely(txq->elts_comp_cd <= 0)) {
                txq->elts_comp_cd = txq->elts_comp_cd_init;
-               srcrb_flags = RTE_BE32(MLX4_WQE_CTRL_SOLICIT |
+               srcrb.flags = RTE_BE32(MLX4_WQE_CTRL_SOLICIT |
                                       MLX4_WQE_CTRL_CQ_UPDATE);
        } else {
-               srcrb_flags = RTE_BE32(MLX4_WQE_CTRL_SOLICIT);
+               srcrb.flags = RTE_BE32(MLX4_WQE_CTRL_SOLICIT);
        }
        /* Enable HW checksum offload if requested */
        if (txq->csum &&
@@ -443,14 +440,26 @@ struct pv {
                        owner_opcode |= MLX4_WQE_CTRL_IIP_HDR_CSUM |
                                        MLX4_WQE_CTRL_IL4_HDR_CSUM;
                        if (pkt->ol_flags & PKT_TX_OUTER_IP_CKSUM)
-                               srcrb_flags |=
+                               srcrb.flags |=
                                        RTE_BE32(MLX4_WQE_CTRL_IP_HDR_CSUM);
                } else {
-                       srcrb_flags |= RTE_BE32(MLX4_WQE_CTRL_IP_HDR_CSUM |
+                       srcrb.flags |= RTE_BE32(MLX4_WQE_CTRL_IP_HDR_CSUM |
                                                MLX4_WQE_CTRL_TCP_UDP_CSUM);
                }
        }
-       ctrl->srcrb_flags = srcrb_flags;
+       if (txq->lb) {
+               /*
+                * Copy destination MAC address to the WQE, this allows
+                * loopback in eSwitch, so that VFs and PF can communicate
+                * with each other.
+                */
+               srcrb.flags16[0] = *(rte_pktmbuf_mtod(pkt, uint16_t *));
+               ctrl->imm = *(rte_pktmbuf_mtod_offset(pkt, uint32_t *,
+                                                     sizeof(uint16_t)));
+       } else {
+               ctrl->imm = 0;
+       }
+       ctrl->srcrb_flags = srcrb.flags;
        /*
         * Make sure descriptor is fully written before
         * setting ownership bit (because HW can start
diff --git a/drivers/net/mlx4/mlx4_rxtx.h b/drivers/net/mlx4/mlx4_rxtx.h
index 6aad41a..37f31f4 100644
--- a/drivers/net/mlx4/mlx4_rxtx.h
+++ b/drivers/net/mlx4/mlx4_rxtx.h
@@ -112,6 +112,7 @@ struct txq {
        uint32_t max_inline; /**< Max inline send size. */
        uint32_t csum:1; /**< Enable checksum offloading. */
        uint32_t csum_l2tun:1; /**< Same for L2 tunnels. */
+       uint32_t lb:1; /**< Whether packets should be looped back by eSwitch. */
        uint8_t *bounce_buf;
        /**< Memory used for storing the first DWORD of data TXBBs. */
        struct {
diff --git a/drivers/net/mlx4/mlx4_txq.c b/drivers/net/mlx4/mlx4_txq.c
index 96429bc..9d1be95 100644
--- a/drivers/net/mlx4/mlx4_txq.c
+++ b/drivers/net/mlx4/mlx4_txq.c
@@ -412,6 +412,8 @@ struct txq_mp2mr_mbuf_check_data {
                      (void *)dev, strerror(rte_errno));
                goto error;
        }
+       /* Enable Tx loopback for VF devices. */
+       tmpl.lb = !!(priv->vf);
        /* Clean up txq in case we're reinitializing it. */
        DEBUG("%p: cleaning-up old txq just in case", (void *)txq);
        mlx4_txq_cleanup(txq);
-- 
1.8.3.1

Reply via email to