> -----Original Message-----
> From: Xing, Beilei <beilei.x...@intel.com>
> Sent: Friday, April 21, 2023 2:51 PM
> To: Wu, Jingjing <jingjing...@intel.com>
> Cc: dev@dpdk.org; Liu, Mingxia <mingxia....@intel.com>; Xing, Beilei
> <beilei.x...@intel.com>; Wang, Xiao W <xiao.w.w...@intel.com>
> Subject: [PATCH 06/10] net/cpfl: support hairpin queue configuration
>
> From: Beilei Xing <beilei.x...@intel.com>
>
> This patch supports Rx/Tx hairpin queue configuration.
>
> Signed-off-by: Xiao Wang <xiao.w.w...@intel.com>
> Signed-off-by: Mingxia Liu <mingxia....@intel.com>
> Signed-off-by: Beilei Xing <beilei.x...@intel.com>
> ---
> drivers/common/idpf/idpf_common_virtchnl.c | 70 +++++++++++
> drivers/common/idpf/idpf_common_virtchnl.h | 6 +
> drivers/common/idpf/version.map | 2 +
> drivers/net/cpfl/cpfl_ethdev.c | 136 ++++++++++++++++++++-
> drivers/net/cpfl/cpfl_rxtx.c | 80 ++++++++++++
> drivers/net/cpfl/cpfl_rxtx.h | 7 ++
> 6 files changed, 297 insertions(+), 4 deletions(-)
>
> diff --git a/drivers/common/idpf/idpf_common_virtchnl.c
> b/drivers/common/idpf/idpf_common_virtchnl.c
> index 76a658bb26..50cd43a8dd 100644
> --- a/drivers/common/idpf/idpf_common_virtchnl.c
> +++ b/drivers/common/idpf/idpf_common_virtchnl.c
> @@ -1050,6 +1050,41 @@ idpf_vc_rxq_config(struct idpf_vport *vport, struct
> idpf_rx_queue *rxq)
> return err;
> }
>
> +int idpf_vc_rxq_config_by_info(struct idpf_vport *vport, struct
> virtchnl2_rxq_info *rxq_info,
> + uint16_t num_qs)
> +{
> + struct idpf_adapter *adapter = vport->adapter;
> + struct virtchnl2_config_rx_queues *vc_rxqs = NULL;
> + struct idpf_cmd_info args;
> + int size, err, i;
> +
> + size = sizeof(*vc_rxqs) + (num_qs - 1) *
> + sizeof(struct virtchnl2_rxq_info);
> + vc_rxqs = rte_zmalloc("cfg_rxqs", size, 0);
> + if (vc_rxqs == NULL) {
> + DRV_LOG(ERR, "Failed to allocate virtchnl2_config_rx_queues");
> + err = -ENOMEM;
> + return err;
> + }
> + vc_rxqs->vport_id = vport->vport_id;
> + vc_rxqs->num_qinfo = num_qs;
> + memcpy(vc_rxqs->qinfo, rxq_info, num_qs * sizeof(struct
> +virtchnl2_rxq_info));
> +
> + memset(&args, 0, sizeof(args));
> + args.ops = VIRTCHNL2_OP_CONFIG_RX_QUEUES;
> + args.in_args = (uint8_t *)vc_rxqs;
> + args.in_args_size = size;
> + args.out_buffer = adapter->mbx_resp;
> + args.out_size = IDPF_DFLT_MBX_BUF_SIZE;
> +
> + err = idpf_vc_cmd_execute(adapter, &args);
> + rte_free(vc_rxqs);
> + if (err != 0)
> + DRV_LOG(ERR, "Failed to execute command of
> +VIRTCHNL2_OP_CONFIG_RX_QUEUES");
> +
> + return err;
> +}
> +
> int
> idpf_vc_txq_config(struct idpf_vport *vport, struct idpf_tx_queue *txq) {
> @@ -
> 1121,6 +1156,41 @@ idpf_vc_txq_config(struct idpf_vport *vport, struct
> idpf_tx_queue *txq)
> return err;
> }
>
> +int
> +idpf_vc_txq_config_by_info(struct idpf_vport *vport, struct
> virtchnl2_txq_info
> *txq_info,
> + uint16_t num_qs)
> +{
> + struct idpf_adapter *adapter = vport->adapter;
> + struct virtchnl2_config_tx_queues *vc_txqs = NULL;
> + struct idpf_cmd_info args;
> + int size, err;
> +
> + size = sizeof(*vc_txqs) + (num_qs - 1) * sizeof(struct
> virtchnl2_txq_info);
> + vc_txqs = rte_zmalloc("cfg_txqs", size, 0);
> + if (vc_txqs == NULL) {
> + DRV_LOG(ERR, "Failed to allocate virtchnl2_config_tx_queues");
> + err = -ENOMEM;
> + return err;
> + }
> + vc_txqs->vport_id = vport->vport_id;
> + vc_txqs->num_qinfo = num_qs;
> + memcpy(vc_txqs->qinfo, txq_info, num_qs * sizeof(struct
> +virtchnl2_txq_info));
> +
> + memset(&args, 0, sizeof(args));
> + args.ops = VIRTCHNL2_OP_CONFIG_TX_QUEUES;
> + args.in_args = (uint8_t *)vc_txqs;
> + args.in_args_size = size;
> + args.out_buffer = adapter->mbx_resp;
> + args.out_size = IDPF_DFLT_MBX_BUF_SIZE;
> +
> + err = idpf_vc_cmd_execute(adapter, &args);
> + rte_free(vc_txqs);
> + if (err != 0)
> + DRV_LOG(ERR, "Failed to execute command of
> +VIRTCHNL2_OP_CONFIG_TX_QUEUES");
> +
> + return err;
> +}
> +
> int
> idpf_vc_ctlq_recv(struct idpf_ctlq_info *cq, u16 *num_q_msg,
> struct idpf_ctlq_msg *q_msg)
> diff --git a/drivers/common/idpf/idpf_common_virtchnl.h
> b/drivers/common/idpf/idpf_common_virtchnl.h
> index bf1d014c8d..277235ba7d 100644
> --- a/drivers/common/idpf/idpf_common_virtchnl.h
> +++ b/drivers/common/idpf/idpf_common_virtchnl.h
> @@ -65,6 +65,12 @@ __rte_internal
> int idpf_vc_ctlq_post_rx_buffs(struct idpf_hw *hw, struct idpf_ctlq_info *cq,
> u16 *buff_count, struct idpf_dma_mem **buffs);
> __rte_internal
> +int idpf_vc_rxq_config_by_info(struct idpf_vport *vport, struct
> virtchnl2_rxq_info *rxq_info,
> + uint16_t num_qs);
> +__rte_internal
> +int idpf_vc_txq_config_by_info(struct idpf_vport *vport, struct
> virtchnl2_txq_info *txq_info,
> + uint16_t num_qs);
> +__rte_internal
> int idpf_vc_queue_grps_del(struct idpf_vport *vport,
> uint16_t num_q_grps,
> struct virtchnl2_queue_group_id *qg_ids); diff --git
> a/drivers/common/idpf/version.map b/drivers/common/idpf/version.map index
> aa67f7ee27..a339a4bf8e 100644
> --- a/drivers/common/idpf/version.map
> +++ b/drivers/common/idpf/version.map
> @@ -59,8 +59,10 @@ INTERNAL {
> idpf_vc_rss_lut_get;
> idpf_vc_rss_lut_set;
> idpf_vc_rxq_config;
> + idpf_vc_rxq_config_by_info;
> idpf_vc_stats_query;
> idpf_vc_txq_config;
> + idpf_vc_txq_config_by_info;
> idpf_vc_vectors_alloc;
> idpf_vc_vectors_dealloc;
> idpf_vc_vport_create;
> diff --git a/drivers/net/cpfl/cpfl_ethdev.c b/drivers/net/cpfl/cpfl_ethdev.c
> index
> d3300f17cc..13edf2e706 100644
> --- a/drivers/net/cpfl/cpfl_ethdev.c
> +++ b/drivers/net/cpfl/cpfl_ethdev.c
> @@ -737,32 +737,160 @@ cpfl_config_rx_queues_irqs(struct rte_eth_dev *dev)
> return idpf_vport_irq_map_config(vport, nb_rx_queues); }
>
> +/* Update hairpin_info for dev's tx hairpin queue */ static int
> +cpfl_txq_hairpin_info_update(struct rte_eth_dev *dev, uint16_t rx_port)
> +{
> + struct cpfl_vport *cpfl_tx_vport = dev->data->dev_private;
> + struct rte_eth_dev *peer_dev = &rte_eth_devices[rx_port];
> + struct cpfl_vport *cpfl_rx_vport = peer_dev->data->dev_private;
> + struct cpfl_txq_hairpin_info *hairpin_info;
> + struct cpfl_tx_queue *cpfl_txq;
> + int i;
> +
> + for (i = cpfl_tx_vport->nb_data_txq; i < dev->data->nb_tx_queues; i++) {
> + cpfl_txq = dev->data->tx_queues[i];
> + hairpin_info = &cpfl_txq->hairpin_info;
> + if (hairpin_info->peer_rxp != rx_port) {
> + PMD_DRV_LOG(ERR, "port %d is not the peer port",
> rx_port);
> + return -EINVAL;
> + }
> + hairpin_info->peer_rxq_id =
> + cpfl_hw_qid_get(cpfl_rx_vport-
> >p2p_q_chunks_info.rx_start_qid,
> + hairpin_info->peer_rxq_id -
> cpfl_rx_vport->nb_data_rxq);
> + }
> +
> + return 0;
> +}
> +
> +/* Bind Rx hairpin queue's memory zone to peer Tx hairpin queue's
> +memory zone */ static void cpfl_rxq_hairpin_mz_bind(struct rte_eth_dev
> +*dev) {
> + struct cpfl_vport *cpfl_rx_vport = dev->data->dev_private;
> + struct idpf_vport *vport = &cpfl_rx_vport->base;
> + struct idpf_adapter *adapter = vport->adapter;
> + struct idpf_hw *hw = &adapter->hw;
> + struct cpfl_rx_queue *cpfl_rxq;
> + struct cpfl_tx_queue *cpfl_txq;
> + struct rte_eth_dev *peer_dev;
> + const struct rte_memzone *mz;
> + uint16_t peer_tx_port;
> + uint16_t peer_tx_qid;
> + int i;
> +
> + for (i = cpfl_rx_vport->nb_data_rxq; i < dev->data->nb_rx_queues; i++) {
> + cpfl_rxq = dev->data->rx_queues[i];
> + peer_tx_port = cpfl_rxq->hairpin_info.peer_txp;
> + peer_tx_qid = cpfl_rxq->hairpin_info.peer_txq_id;
> + peer_dev = &rte_eth_devices[peer_tx_port];
> + cpfl_txq = peer_dev->data->tx_queues[peer_tx_qid];
> +
> + /* bind rx queue */
> + mz = cpfl_txq->base.mz;
> + cpfl_rxq->base.rx_ring_phys_addr = mz->iova;
> + cpfl_rxq->base.rx_ring = mz->addr;
> + cpfl_rxq->base.mz = mz;
> +
> + /* bind rx buffer queue */
> + mz = cpfl_txq->base.complq->mz;
> + cpfl_rxq->base.bufq1->rx_ring_phys_addr = mz->iova;
> + cpfl_rxq->base.bufq1->rx_ring = mz->addr;
> + cpfl_rxq->base.bufq1->mz = mz;
> + cpfl_rxq->base.bufq1->qrx_tail = hw->hw_addr +
> + cpfl_hw_qtail_get(cpfl_rx_vport-
> >p2p_q_chunks_info.rx_buf_qtail_start,
> + 0, cpfl_rx_vport-
> >p2p_q_chunks_info.rx_buf_qtail_spacing);
> + }
> +}
> +
> static int
> cpfl_start_queues(struct rte_eth_dev *dev) {
> + struct cpfl_vport *cpfl_vport = dev->data->dev_private;
> + struct idpf_vport *vport = &cpfl_vport->base;
> struct cpfl_rx_queue *cpfl_rxq;
> struct cpfl_tx_queue *cpfl_txq;
> + int tx_cmplq_flag = 0;
> + int rx_bufq_flag = 0;
> + int flag = 0;
> int err = 0;
> int i;
>
> + /* For normal data queues, configure, init and enale Txq.
> + * For non-cross vport hairpin queues, configure Txq.
> + */
> for (i = 0; i < dev->data->nb_tx_queues; i++) {
> cpfl_txq = dev->data->tx_queues[i];
> if (cpfl_txq == NULL || cpfl_txq->base.tx_deferred_start)
> continue;
> - err = cpfl_tx_queue_start(dev, i);
> + if (!cpfl_txq->hairpin_info.hairpin_q) {
> + err = cpfl_tx_queue_start(dev, i);
> + if (err != 0) {
> + PMD_DRV_LOG(ERR, "Fail to start Tx
> queue %u", i);
> + return err;
> + }
> + } else if (!cpfl_txq->hairpin_info.manual_bind) {
> + if (flag == 0) {
> + err = cpfl_txq_hairpin_info_update(dev,
> + cpfl_txq-
> >hairpin_info.peer_rxp);
> + if (err != 0) {
> + PMD_DRV_LOG(ERR, "Fail to update Tx
> hairpin queue info");
> + return err;
> + }
> + flag = 1;
[Liu, Mingxia] The variable flag is not been used, can it be removed?
> + }
> + err = cpfl_hairpin_txq_config(vport, cpfl_txq);
> + if (err != 0) {
> + PMD_DRV_LOG(ERR, "Fail to configure hairpin
> Tx queue %u", i);
> + return err;
> + }
> + tx_cmplq_flag = 1;
> + }
> + }
> +
> + /* For non-cross vport hairpin queues, configure Tx completion queue
> first.*/
> + if (tx_cmplq_flag == 1 && cpfl_vport->p2p_tx_complq != NULL) {
> + err = cpfl_hairpin_tx_complq_config(cpfl_vport);
> if (err != 0) {
> - PMD_DRV_LOG(ERR, "Fail to start Tx queue %u", i);
> + PMD_DRV_LOG(ERR, "Fail to config Tx completion
> queue");
> return err;
> }
> }
>
[Liu, Mingxia] Better to move this code next to
+ err = cpfl_hairpin_txq_config(vport, cpfl_txq);
+ if (err != 0) {
+ PMD_DRV_LOG(ERR, "Fail to configure hairpin Tx
queue %u", i);
+ return err;
+ }
When cpfl_rxq->hairpin_info.hairpin_q is true, then cpfl_vport->p2p_tx_complq
is not null, right ?
And remove tx_cmplq_flag?
> + /* For normal data queues, configure, init and enale Rxq.
> + * For non-cross vport hairpin queues, configure Rxq, and then init Rxq.
> + */
> + cpfl_rxq_hairpin_mz_bind(dev);
> for (i = 0; i < dev->data->nb_rx_queues; i++) {
> cpfl_rxq = dev->data->rx_queues[i];
> if (cpfl_rxq == NULL || cpfl_rxq->base.rx_deferred_start)
> continue;
> - err = cpfl_rx_queue_start(dev, i);
> + if (!cpfl_rxq->hairpin_info.hairpin_q) {
> + err = cpfl_rx_queue_start(dev, i);
> + if (err != 0) {
> + PMD_DRV_LOG(ERR, "Fail to start Rx
> queue %u", i);
> + return err;
> + }
> + } else if (!cpfl_rxq->hairpin_info.manual_bind) {
> + err = cpfl_hairpin_rxq_config(vport, cpfl_rxq);
> + if (err != 0) {
> + PMD_DRV_LOG(ERR, "Fail to configure hairpin
> Rx queue %u", i);
> + return err;
> + }
> + err = cpfl_rx_queue_init(dev, i);
> + if (err != 0) {
> + PMD_DRV_LOG(ERR, "Fail to init hairpin Rx
> queue %u", i);
> + return err;
> + }
> + rx_bufq_flag = 1;
> + }
> + }
> +
> + /* For non-cross vport hairpin queues, configure Rx buffer queue.*/
> + if (rx_bufq_flag == 1 && cpfl_vport->p2p_rx_bufq != NULL) {
> + err = cpfl_hairpin_rx_bufq_config(cpfl_vport);
> if (err != 0) {
> - PMD_DRV_LOG(ERR, "Fail to start Rx queue %u", i);
> + PMD_DRV_LOG(ERR, "Fail to config Rx buffer queue");
> return err;
> }
> }
[Liu, Mingxia] Similar to above.
> diff --git a/drivers/net/cpfl/cpfl_rxtx.c b/drivers/net/cpfl/cpfl_rxtx.c index
> 64ed331a6d..040beb5bac 100644
> --- a/drivers/net/cpfl/cpfl_rxtx.c
> +++ b/drivers/net/cpfl/cpfl_rxtx.c
> @@ -930,6 +930,86 @@ cpfl_tx_hairpin_queue_setup(struct rte_eth_dev *dev,
> uint16_t queue_idx,
> return 0;
> }
>
> +int
> +cpfl_hairpin_rx_bufq_config(struct cpfl_vport *cpfl_vport) {
> + struct idpf_rx_queue *rx_bufq = cpfl_vport->p2p_rx_bufq;
> + struct virtchnl2_rxq_info rxq_info[1] = {0};
> +
> + rxq_info[0].type = VIRTCHNL2_QUEUE_TYPE_RX_BUFFER;
> + rxq_info[0].queue_id = rx_bufq->queue_id;
> + rxq_info[0].ring_len = rx_bufq->nb_rx_desc;
> + rxq_info[0].dma_ring_addr = rx_bufq->rx_ring_phys_addr;
> + rxq_info[0].desc_ids = VIRTCHNL2_RXDID_2_FLEX_SPLITQ_M;
> + rxq_info[0].rx_buffer_low_watermark =
> CPFL_RXBUF_LOW_WATERMARK;
> + rxq_info[0].model = VIRTCHNL2_QUEUE_MODEL_SPLIT;
> + rxq_info[0].data_buffer_size = rx_bufq->rx_buf_len;
> + rxq_info[0].buffer_notif_stride = CPFL_RX_BUF_STRIDE;
> +
> + return idpf_vc_rxq_config_by_info(&cpfl_vport->base, rxq_info, 1); }
> +
> +int
> +cpfl_hairpin_rxq_config(struct idpf_vport *vport, struct cpfl_rx_queue
> +*cpfl_rxq) {
> + struct virtchnl2_rxq_info rxq_info[1] = {0};
> + struct idpf_rx_queue *rxq = &cpfl_rxq->base;
> +
> + rxq_info[0].type = VIRTCHNL2_QUEUE_TYPE_RX;
> + rxq_info[0].queue_id = rxq->queue_id;
> + rxq_info[0].ring_len = rxq->nb_rx_desc;
> + rxq_info[0].dma_ring_addr = rxq->rx_ring_phys_addr;
> + rxq_info[0].rx_bufq1_id = rxq->bufq1->queue_id;
> + rxq_info[0].max_pkt_size = vport->max_pkt_len;
> + rxq_info[0].desc_ids = VIRTCHNL2_RXDID_2_FLEX_SPLITQ_M;
> + rxq_info[0].qflags |= VIRTCHNL2_RX_DESC_SIZE_16BYTE;
> +
> + rxq_info[0].data_buffer_size = rxq->rx_buf_len;
> + rxq_info[0].model = VIRTCHNL2_QUEUE_MODEL_SPLIT;
> + rxq_info[0].rx_buffer_low_watermark =
> CPFL_RXBUF_LOW_WATERMARK;
> +
> + PMD_DRV_LOG(NOTICE, "hairpin: vport %u, Rxq id 0x%x",
> + vport->vport_id, rxq_info[0].queue_id);
> +
> + return idpf_vc_rxq_config_by_info(vport, rxq_info, 1); }
> +
> +int
> +cpfl_hairpin_tx_complq_config(struct cpfl_vport *cpfl_vport) {
> + struct idpf_tx_queue *tx_complq = cpfl_vport->p2p_tx_complq;
> + struct virtchnl2_txq_info txq_info[1] = {0};
> +
> + txq_info[0].dma_ring_addr = tx_complq->tx_ring_phys_addr;
> + txq_info[0].type = VIRTCHNL2_QUEUE_TYPE_TX_COMPLETION;
> + txq_info[0].queue_id = tx_complq->queue_id;
> + txq_info[0].ring_len = tx_complq->nb_tx_desc;
> + txq_info[0].peer_rx_queue_id = cpfl_vport->p2p_rx_bufq->queue_id;
> + txq_info[0].model = VIRTCHNL2_QUEUE_MODEL_SPLIT;
> + txq_info[0].sched_mode = VIRTCHNL2_TXQ_SCHED_MODE_FLOW;
> +
> + return idpf_vc_txq_config_by_info(&cpfl_vport->base, txq_info, 1); }
> +
> +int
> +cpfl_hairpin_txq_config(struct idpf_vport *vport, struct cpfl_tx_queue
> +*cpfl_txq) {
> + struct idpf_tx_queue *txq = &cpfl_txq->base;
> + struct virtchnl2_txq_info txq_info[1] = {0};
> +
> + txq_info[0].dma_ring_addr = txq->tx_ring_phys_addr;
> + txq_info[0].type = VIRTCHNL2_QUEUE_TYPE_TX;
> + txq_info[0].queue_id = txq->queue_id;
> + txq_info[0].ring_len = txq->nb_tx_desc;
> + txq_info[0].tx_compl_queue_id = txq->complq->queue_id;
> + txq_info[0].relative_queue_id = txq->queue_id;
> + txq_info[0].peer_rx_queue_id = cpfl_txq->hairpin_info.peer_rxq_id;
> + txq_info[0].model = VIRTCHNL2_QUEUE_MODEL_SPLIT;
> + txq_info[0].sched_mode = VIRTCHNL2_TXQ_SCHED_MODE_FLOW;
> +
> + return idpf_vc_txq_config_by_info(vport, txq_info, 1); }
> +
> int
> cpfl_rx_queue_init(struct rte_eth_dev *dev, uint16_t rx_queue_id) { diff
> --git
> a/drivers/net/cpfl/cpfl_rxtx.h b/drivers/net/cpfl/cpfl_rxtx.h index
> d844c9f057..b01ce5edf9 100644
> --- a/drivers/net/cpfl/cpfl_rxtx.h
> +++ b/drivers/net/cpfl/cpfl_rxtx.h
> @@ -30,12 +30,15 @@
> #define CPFL_RING_BASE_ALIGN 128
>
> #define CPFL_DEFAULT_RX_FREE_THRESH 32
> +#define CPFL_RXBUF_LOW_WATERMARK 64
>
> #define CPFL_DEFAULT_TX_RS_THRESH 32
> #define CPFL_DEFAULT_TX_FREE_THRESH 32
>
> #define CPFL_SUPPORT_CHAIN_NUM 5
>
> +#define CPFL_RX_BUF_STRIDE 64
> +
> struct cpfl_rxq_hairpin_info {
> bool hairpin_q; /* if rx queue is a hairpin queue */
> bool manual_bind; /* for cross vport */
> @@ -85,4 +88,8 @@ int cpfl_rx_hairpin_queue_setup(struct rte_eth_dev *dev,
> uint16_t queue_idx, int cpfl_tx_hairpin_queue_setup(struct rte_eth_dev *dev,
> uint16_t queue_idx,
> uint16_t nb_desc,
> const struct rte_eth_hairpin_conf *conf);
> +int cpfl_hairpin_tx_complq_config(struct cpfl_vport *cpfl_vport); int
> +cpfl_hairpin_txq_config(struct idpf_vport *vport, struct cpfl_tx_queue
> +*cpfl_txq); int cpfl_hairpin_rx_bufq_config(struct cpfl_vport
> +*cpfl_vport); int cpfl_hairpin_rxq_config(struct idpf_vport *vport,
> +struct cpfl_rx_queue *cpfl_rxq);
> #endif /* _CPFL_RXTX_H_ */
> --
> 2.26.2