[dpdk-dev] [PATCH v4 2/5] net/tap: fix mbuf and mem leak during queue release

2020-04-11 Thread wangyunjian
From: Yunjian Wang 

For the tap PMD, we should release mbufs and iovecs from the Rx queue when
closing device. In order to remove duplicated code, rte_pmd_tap_remove()
calls tap_dev_close().

Fixes: 0781f5762cfe ("net/tap: support segmented mbufs")
CC: sta...@dpdk.org

Signed-off-by: Yunjian Wang 
---
 drivers/net/tap/rte_eth_tap.c | 36 ++-
 1 file changed, 14 insertions(+), 22 deletions(-)

diff --git a/drivers/net/tap/rte_eth_tap.c b/drivers/net/tap/rte_eth_tap.c
index 3f4042e5b..0156d689d 100644
--- a/drivers/net/tap/rte_eth_tap.c
+++ b/drivers/net/tap/rte_eth_tap.c
@@ -1023,15 +1023,25 @@ tap_dev_close(struct rte_eth_dev *dev)
int i;
struct pmd_internals *internals = dev->data->dev_private;
struct pmd_process_private *process_private = dev->process_private;
+   struct rx_queue *rxq;
 
tap_link_set_down(dev);
-   tap_flow_flush(dev, NULL);
-   tap_flow_implicit_flush(internals, NULL);
+   if (internals->nlsk_fd != -1) {
+   tap_flow_flush(dev, NULL);
+   tap_flow_implicit_flush(internals, NULL);
+   tap_nl_final(internals->nlsk_fd);
+   internals->nlsk_fd = -1;
+   }
 
for (i = 0; i < RTE_PMD_TAP_MAX_QUEUES; i++) {
if (process_private->rxq_fds[i] != -1) {
+   rxq = &internals->rxq[i];
close(process_private->rxq_fds[i]);
process_private->rxq_fds[i] = -1;
+   rte_pktmbuf_free(rxq->pool);
+   rte_free(rxq->iovecs);
+   rxq->pool = NULL;
+   rxq->iovecs = NULL;
}
if (process_private->txq_fds[i] != -1) {
close(process_private->txq_fds[i]);
@@ -2399,8 +2409,6 @@ rte_pmd_tap_remove(struct rte_vdev_device *dev)
 {
struct rte_eth_dev *eth_dev = NULL;
struct pmd_internals *internals;
-   struct pmd_process_private *process_private;
-   int i;
 
/* find the ethdev entry */
eth_dev = rte_eth_dev_allocated(rte_vdev_device_name(dev));
@@ -2413,28 +2421,12 @@ rte_pmd_tap_remove(struct rte_vdev_device *dev)
if (rte_eal_process_type() != RTE_PROC_PRIMARY)
return rte_eth_dev_release_port(eth_dev);
 
-   internals = eth_dev->data->dev_private;
-   process_private = eth_dev->process_private;
+   tap_dev_close(eth_dev);
 
+   internals = eth_dev->data->dev_private;
TAP_LOG(DEBUG, "Closing %s Ethernet device on numa %u",
tuntap_types[internals->type], rte_socket_id());
 
-   if (internals->nlsk_fd) {
-   tap_flow_flush(eth_dev, NULL);
-   tap_flow_implicit_flush(internals, NULL);
-   tap_nl_final(internals->nlsk_fd);
-   }
-   for (i = 0; i < RTE_PMD_TAP_MAX_QUEUES; i++) {
-   if (process_private->rxq_fds[i] != -1) {
-   close(process_private->rxq_fds[i]);
-   process_private->rxq_fds[i] = -1;
-   }
-   if (process_private->txq_fds[i] != -1) {
-   close(process_private->txq_fds[i]);
-   process_private->txq_fds[i] = -1;
-   }
-   }
-
close(internals->ioctl_sock);
rte_free(eth_dev->process_private);
if (tap_devices_count == 1)
-- 
2.19.1




[dpdk-dev] [PATCH v4 1/5] net/tap: fix mbuf double free when writev fails

2020-04-11 Thread wangyunjian
From: Yunjian Wang 

When the tap_write_mbufs() function return with break, mbuf was freed
without increasing num_packets, which could cause applications to free
the mbuf again. And the pmd_tx_burst() function should returns the
number of original packets it actually sent excluding tso mbufs.

Fixes: 9396ad334672 ("net/tap: fix reported number of Tx packets")
CC: sta...@dpdk.org

Signed-off-by: Yunjian Wang 
---
 drivers/net/tap/rte_eth_tap.c | 34 ++
 1 file changed, 22 insertions(+), 12 deletions(-)

diff --git a/drivers/net/tap/rte_eth_tap.c b/drivers/net/tap/rte_eth_tap.c
index 05470a211..3f4042e5b 100644
--- a/drivers/net/tap/rte_eth_tap.c
+++ b/drivers/net/tap/rte_eth_tap.c
@@ -521,7 +521,7 @@ tap_tx_l3_cksum(char *packet, uint64_t ol_flags, unsigned 
int l2_len,
}
 }
 
-static inline void
+static inline int
 tap_write_mbufs(struct tx_queue *txq, uint16_t num_mbufs,
struct rte_mbuf **pmbufs,
uint16_t *num_packets, unsigned long *num_tx_bytes)
@@ -588,7 +588,7 @@ tap_write_mbufs(struct tx_queue *txq, uint16_t num_mbufs,
seg_len = rte_pktmbuf_data_len(mbuf);
l234_hlen = mbuf->l2_len + mbuf->l3_len + mbuf->l4_len;
if (seg_len < l234_hlen)
-   break;
+   return -1;
 
/* To change checksums, work on a * copy of l2, l3
 * headers + l4 pseudo header
@@ -634,10 +634,12 @@ tap_write_mbufs(struct tx_queue *txq, uint16_t num_mbufs,
/* copy the tx frame data */
n = writev(process_private->txq_fds[txq->queue_id], iovecs, j);
if (n <= 0)
-   break;
+   return -1;
+
(*num_packets)++;
(*num_tx_bytes) += rte_pktmbuf_pkt_len(mbuf);
}
+   return 0;
 }
 
 /* Callback to handle sending packets from the tap interface
@@ -663,8 +665,8 @@ pmd_tx_burst(void *queue, struct rte_mbuf **bufs, uint16_t 
nb_pkts)
uint16_t num_mbufs = 0;
uint16_t tso_segsz = 0;
int ret;
+   int num_tso_mbufs;
uint16_t hdrs_len;
-   int j;
uint64_t tso;
 
tso = mbuf_in->ol_flags & PKT_TX_TCP_SEG;
@@ -686,43 +688,51 @@ pmd_tx_burst(void *queue, struct rte_mbuf **bufs, 
uint16_t nb_pkts)
break;
}
gso_ctx->gso_size = tso_segsz;
-   ret = rte_gso_segment(mbuf_in, /* packet to segment */
+   /* 'mbuf_in' packet to segment */
+   num_tso_mbufs = rte_gso_segment(mbuf_in,
gso_ctx, /* gso control block */
(struct rte_mbuf **)&gso_mbufs, /* out mbufs */
RTE_DIM(gso_mbufs)); /* max tso mbufs */
 
/* ret contains the number of new created mbufs */
-   if (ret < 0)
+   if (num_tso_mbufs < 0)
break;
 
mbuf = gso_mbufs;
-   num_mbufs = ret;
+   num_mbufs = num_tso_mbufs;
} else {
/* stats.errs will be incremented */
if (rte_pktmbuf_pkt_len(mbuf_in) > max_size)
break;
 
/* ret 0 indicates no new mbufs were created */
-   ret = 0;
+   num_tso_mbufs = 0;
mbuf = &mbuf_in;
num_mbufs = 1;
}
 
-   tap_write_mbufs(txq, num_mbufs, mbuf,
+   ret = tap_write_mbufs(txq, num_mbufs, mbuf,
&num_packets, &num_tx_bytes);
+   if (ret == -1) {
+   txq->stats.errs++;
+   /* free tso mbufs */
+   if (num_tso_mbufs > 0)
+   rte_pktmbuf_free_bulk(mbuf, num_tso_mbufs);
+   break;
+   }
num_tx++;
/* free original mbuf */
rte_pktmbuf_free(mbuf_in);
/* free tso mbufs */
-   for (j = 0; j < ret; j++)
-   rte_pktmbuf_free(mbuf[j]);
+   if (num_tso_mbufs > 0)
+   rte_pktmbuf_free_bulk(mbuf, num_tso_mbufs);
}
 
txq->stats.opackets += num_packets;
txq->stats.errs += nb_pkts - num_tx;
txq->stats.obytes += num_tx_bytes;
 
-   return num_packets;
+   return num_tx;
 }
 
 static const char *
-- 
2.19.1




[dpdk-dev] [PATCH v4 0/5] fixes for tap

2020-04-11 Thread wangyunjian
From: Yunjian Wang 

This series include five fixes patches for tap PMD driver.

--
v4:
* Update some code suggested by Ferruh Yigit and Stephen Hemminger
* Update commit log
* Add fix leak of fds on failure
v3:
* Add fix close a vaild fd and netlink socket file descriptor check
  before close
v2:
* Add null check in tap_rxq_pool_free()

Yunjian Wang (5):
  net/tap: fix mbuf double free when writev fails
  net/tap: fix mbuf and mem leak during queue release
  net/tap: fix check for mbuf's nb_segs failure
  net/tap: fix close a valid fd
  net/tap: fix leak of fds on failure

 drivers/net/tap/rte_eth_tap.c | 102 --
 1 file changed, 59 insertions(+), 43 deletions(-)

-- 
2.19.1




[dpdk-dev] [PATCH v4 3/5] net/tap: fix check for mbuf's nb_segs failure

2020-04-11 Thread wangyunjian
From: Yunjian Wang 

Now the rxq->pool is mbuf concatenation, but its nb_segs is 1. When
conducting some sanity checks on the mbuf with debug enabled, it fails.

Fixes: 0781f5762cfe ("net/tap: support segmented mbufs")
CC: sta...@dpdk.org

Signed-off-by: Yunjian Wang 
---
 drivers/net/tap/rte_eth_tap.c | 21 +
 1 file changed, 17 insertions(+), 4 deletions(-)

diff --git a/drivers/net/tap/rte_eth_tap.c b/drivers/net/tap/rte_eth_tap.c
index 0156d689d..6a77b2a7e 100644
--- a/drivers/net/tap/rte_eth_tap.c
+++ b/drivers/net/tap/rte_eth_tap.c
@@ -339,6 +339,19 @@ tap_rx_offload_get_queue_capa(void)
   DEV_RX_OFFLOAD_TCP_CKSUM;
 }
 
+static void
+tap_rxq_pool_free(struct rte_mbuf *pool)
+{
+   struct rte_mbuf *next;
+
+   while (pool) {
+   next = pool->next;
+   pool->next = NULL;
+   rte_pktmbuf_free(pool);
+   pool = next;
+   }
+}
+
 /* Callback to handle the rx burst of packets to the correct interface and
  * file descriptor(s) in a multi-queue setup.
  */
@@ -389,7 +402,7 @@ pmd_rx_burst(void *queue, struct rte_mbuf **bufs, uint16_t 
nb_pkts)
goto end;
 
seg->next = NULL;
-   rte_pktmbuf_free(mbuf);
+   tap_rxq_pool_free(mbuf);
 
goto end;
}
@@ -1038,7 +1051,7 @@ tap_dev_close(struct rte_eth_dev *dev)
rxq = &internals->rxq[i];
close(process_private->rxq_fds[i]);
process_private->rxq_fds[i] = -1;
-   rte_pktmbuf_free(rxq->pool);
+   tap_rxq_pool_free(rxq->pool);
rte_free(rxq->iovecs);
rxq->pool = NULL;
rxq->iovecs = NULL;
@@ -1077,7 +1090,7 @@ tap_rx_queue_release(void *queue)
if (process_private->rxq_fds[rxq->queue_id] > 0) {
close(process_private->rxq_fds[rxq->queue_id]);
process_private->rxq_fds[rxq->queue_id] = -1;
-   rte_pktmbuf_free(rxq->pool);
+   tap_rxq_pool_free(rxq->pool);
rte_free(rxq->iovecs);
rxq->pool = NULL;
rxq->iovecs = NULL;
@@ -1485,7 +1498,7 @@ tap_rx_queue_setup(struct rte_eth_dev *dev,
return 0;
 
 error:
-   rte_pktmbuf_free(rxq->pool);
+   tap_rxq_pool_free(rxq->pool);
rxq->pool = NULL;
rte_free(rxq->iovecs);
rxq->iovecs = NULL;
-- 
2.19.1




[dpdk-dev] [PATCH v4 5/5] net/tap: fix leak of fds on failure

2020-04-11 Thread wangyunjian
From: Yunjian Wang 

When eth_dev_tap_create() is failed, nlsk_fd and ka_fd won't be closed
thus leading fds leak. Zero is a valid fd. Ultimately leads to a valid
fd was closed by mistake.

Fixes: bf7b7f437b49 ("net/tap: create netdevice during probing")
Fixes: cb7e68da630a ("net/tap: fix cleanup on allocation failure")
CC: sta...@dpdk.org

Signed-off-by: Yunjian Wang 
---
 drivers/net/tap/rte_eth_tap.c | 9 +++--
 1 file changed, 7 insertions(+), 2 deletions(-)

diff --git a/drivers/net/tap/rte_eth_tap.c b/drivers/net/tap/rte_eth_tap.c
index 829a9e9b4..9bea5d9d0 100644
--- a/drivers/net/tap/rte_eth_tap.c
+++ b/drivers/net/tap/rte_eth_tap.c
@@ -1820,6 +1820,8 @@ eth_dev_tap_create(struct rte_vdev_device *vdev, const 
char *tap_name,
pmd->dev = dev;
strlcpy(pmd->name, tap_name, sizeof(pmd->name));
pmd->type = type;
+   pmd->ka_fd = -1;
+   pmd->nlsk_fd = -1;
 
pmd->ioctl_sock = socket(AF_INET, SOCK_DGRAM, 0);
if (pmd->ioctl_sock == -1) {
@@ -1850,7 +1852,6 @@ eth_dev_tap_create(struct rte_vdev_device *vdev, const 
char *tap_name,
dev->intr_handle = &pmd->intr_handle;
 
/* Presetup the fds to -1 as being not valid */
-   pmd->ka_fd = -1;
for (i = 0; i < RTE_PMD_TAP_MAX_QUEUES; i++) {
process_private->rxq_fds[i] = -1;
process_private->txq_fds[i] = -1;
@@ -1990,7 +1991,11 @@ eth_dev_tap_create(struct rte_vdev_device *vdev, const 
char *tap_name,
tap_flow_implicit_flush(pmd, NULL);
 
 error_exit:
-   if (pmd->ioctl_sock > 0)
+   if (pmd->nlsk_fd == -1)
+   close(pmd->nlsk_fd);
+   if (pmd->ka_fd != -1)
+   close(pmd->ka_fd);
+   if (pmd->ioctl_sock != -1)
close(pmd->ioctl_sock);
/* mac_addrs must not be freed alone because part of dev_private */
dev->data->mac_addrs = NULL;
-- 
2.19.1




[dpdk-dev] [PATCH v4 4/5] net/tap: fix close a valid fd

2020-04-11 Thread wangyunjian
From: Yunjian Wang 

The internal structure is freed and set to NULL in the
rte_eth_dev_release_port() and zero is a valid fd. Ultimately
leads to a valid fd was closed by mistake.

Fixes: 3101191c63ab ("net/tap: fix device removal when no queue exist")
CC: sta...@dpdk.org

Signed-off-by: Yunjian Wang 
---
 drivers/net/tap/rte_eth_tap.c | 4 
 1 file changed, 4 deletions(-)

diff --git a/drivers/net/tap/rte_eth_tap.c b/drivers/net/tap/rte_eth_tap.c
index 6a77b2a7e..829a9e9b4 100644
--- a/drivers/net/tap/rte_eth_tap.c
+++ b/drivers/net/tap/rte_eth_tap.c
@@ -2447,10 +2447,6 @@ rte_pmd_tap_remove(struct rte_vdev_device *dev)
tap_devices_count--;
rte_eth_dev_release_port(eth_dev);
 
-   if (internals->ka_fd != -1) {
-   close(internals->ka_fd);
-   internals->ka_fd = -1;
-   }
return 0;
 }
 
-- 
2.19.1




[dpdk-dev] [PATCH v2 1/4] ethdev: add tm support for shaper config in pkt mode

2020-04-11 Thread Nithin Dabilpuram
From: Nithin Dabilpuram 

Some NIC hardware support shaper to work in packet mode i.e
shaping or ratelimiting traffic is in packets per second (PPS) as
opposed to default bytes per second (BPS). Hence this patch
adds support to configure shared or private shaper in packet mode,
provide rate in PPS and add related tm capabilities in port/level/node
capability structures.

This patch also updates tm port/level/node capability structures with
exiting features of scheduler wfq packet mode, scheduler wfq byte mode
and private/shared shaper byte mode.

Signed-off-by: Nithin Dabilpuram 
---

v1..v2:
- Add seperate capability for shaper and scheduler pktmode and bytemode.
- Add packet_mode field in struct rte_tm_shaper_params to indicate
packet mode shaper profile.

 lib/librte_ethdev/rte_tm.h | 156 -
 1 file changed, 154 insertions(+), 2 deletions(-)

diff --git a/lib/librte_ethdev/rte_tm.h b/lib/librte_ethdev/rte_tm.h
index f9c0cf3..38fff4c 100644
--- a/lib/librte_ethdev/rte_tm.h
+++ b/lib/librte_ethdev/rte_tm.h
@@ -250,6 +250,23 @@ struct rte_tm_capabilities {
 */
uint64_t shaper_private_rate_max;
 
+   /** Shaper private packet mode supported. When non-zero, this parameter
+* indicates that there is atleast one node that can be configured
+* with packet mode in it's private shaper. When shaper is configured
+* in packet mode, committed/peak rate provided is interpreted
+* in packets per second.
+*/
+   int shaper_private_packet_mode_supported;
+
+   /** Shaper private byte mode supported. When non-zero, this parameter
+* indicates that there is atleast one node that can be configured
+* with byte mode in it's private shaper. When shaper is configured
+* in byte mode, committed/peak rate provided is interpreted in
+* bytes per second.
+*/
+   int shaper_private_byte_mode_supported;
+
+
/** Maximum number of shared shapers. The value of zero indicates that
 * shared shapers are not supported.
 */
@@ -284,6 +301,21 @@ struct rte_tm_capabilities {
 */
uint64_t shaper_shared_rate_max;
 
+   /** Shaper shared packet mode supported. When non-zero, this parameter
+* indicates a shared shaper can be configured with packet mode.
+* When shared shaper is configured in packet mode, committed/peak rate
+* provided is interpreted in packets per second.
+*/
+   int shaper_shared_packet_mode_supported;
+
+   /** Shaper shared byte mode supported. When non-zero, this parameter
+* indicates that a shared shaper can be configured with byte mode.
+* When shared shaper is configured in byte mode, committed/peak rate
+* provided is interpreted in bytes per second.
+*/
+   int shaper_shared_byte_mode_supported;
+
+
/** Minimum value allowed for packet length adjustment for any private
 * or shared shaper.
 */
@@ -339,6 +371,22 @@ struct rte_tm_capabilities {
 */
uint32_t sched_wfq_weight_max;
 
+   /** WFQ packet mode supported. When non-zero, this parameter indicates
+* that there is at least one non-leaf node that supports packet mode
+* for WFQ among its children. WFQ weights will be applied against
+* packet count for scheduling children when a non-leaf node
+* is configured appropriately.
+*/
+   int sched_wfq_packet_mode_supported;
+
+   /** WFQ byte mode supported. When non-zero, this parameter indicates
+* that there is at least one non-leaf node that supports byte mode
+* for WFQ among its children. WFQ weights will be applied against
+* bytes for scheduling children when a non-leaf node is configured
+* appropriately.
+*/
+   int sched_wfq_byte_mode_supported;
+
/** WRED packet mode support. When non-zero, this parameter indicates
 * that there is at least one leaf node that supports the WRED packet
 * mode, which might not be true for all the leaf nodes. In packet
@@ -485,6 +533,24 @@ struct rte_tm_level_capabilities {
 */
uint64_t shaper_private_rate_max;
 
+   /** Shaper private packet mode supported. When non-zero,
+* this parameter indicates there is atleast one
+* non-leaf node at this level that can be configured
+* with packet mode in its private shaper. When private
+* shaper is configured in packet mode, committed/peak
+* rate provided is interpreted in packets per second.
+*/
+   int shaper_private_packet_mode_supported;
+
+   /** Shaper private byte mode supported. When non-zero,
+* this parameter indicates there

[dpdk-dev] [PATCH v2 2/4] drivers/net: update tm capability for existing pmds

2020-04-11 Thread Nithin Dabilpuram
From: Nithin Dabilpuram 

Since existing PMD's support shaper byte mode and scheduler
wfq byte mode, update the same in their port/level/node capabilities
that are added.

Signed-off-by: Nithin Dabilpuram 
---
v1..v2:
- Newly included patch to change exiting pmd's with tm support of byte mode 
to show the same in port/level/node cap.

 drivers/net/i40e/i40e_tm.c   | 16 
 drivers/net/ipn3ke/ipn3ke_tm.c   | 26 ++
 drivers/net/ixgbe/ixgbe_tm.c | 16 
 drivers/net/mvpp2/mrvl_tm.c  | 14 ++
 drivers/net/softnic/rte_eth_softnic_tm.c | 45 
 5 files changed, 117 insertions(+)

diff --git a/drivers/net/i40e/i40e_tm.c b/drivers/net/i40e/i40e_tm.c
index c76760c..ab272e9 100644
--- a/drivers/net/i40e/i40e_tm.c
+++ b/drivers/net/i40e/i40e_tm.c
@@ -160,12 +160,16 @@ i40e_tm_capabilities_get(struct rte_eth_dev *dev,
cap->shaper_private_rate_min = 0;
/* 40Gbps -> 5GBps */
cap->shaper_private_rate_max = 50ull;
+   cap->shaper_private_packet_mode_supported = 0;
+   cap->shaper_private_byte_mode_supported = 1;
cap->shaper_shared_n_max = 0;
cap->shaper_shared_n_nodes_per_shaper_max = 0;
cap->shaper_shared_n_shapers_per_node_max = 0;
cap->shaper_shared_dual_rate_n_max = 0;
cap->shaper_shared_rate_min = 0;
cap->shaper_shared_rate_max = 0;
+   cap->shaper_shared_packet_mode_supported = 0;
+   cap->shaper_shared_byte_mode_supported = 0;
cap->sched_n_children_max = hw->func_caps.num_tx_qp;
/**
 * HW supports SP. But no plan to support it now.
@@ -179,6 +183,8 @@ i40e_tm_capabilities_get(struct rte_eth_dev *dev,
 * So, all the nodes should have the same weight.
 */
cap->sched_wfq_weight_max = 1;
+   cap->sched_wfq_packet_mode_supported = 0;
+   cap->sched_wfq_byte_mode_supported = 0;
cap->cman_head_drop_supported = 0;
cap->dynamic_update_mask = 0;
cap->shaper_pkt_length_adjust_min = RTE_TM_ETH_FRAMING_OVERHEAD;
@@ -754,6 +760,8 @@ i40e_level_capabilities_get(struct rte_eth_dev *dev,
cap->nonleaf.shaper_private_rate_min = 0;
/* 40Gbps -> 5GBps */
cap->nonleaf.shaper_private_rate_max = 50ull;
+   cap->nonleaf.shaper_private_packet_mode_supported = 0;
+   cap->nonleaf.shaper_private_byte_mode_supported = 1;
cap->nonleaf.shaper_shared_n_max = 0;
if (level_id == I40E_TM_NODE_TYPE_PORT)
cap->nonleaf.sched_n_children_max =
@@ -765,6 +773,8 @@ i40e_level_capabilities_get(struct rte_eth_dev *dev,
cap->nonleaf.sched_wfq_n_children_per_group_max = 0;
cap->nonleaf.sched_wfq_n_groups_max = 0;
cap->nonleaf.sched_wfq_weight_max = 1;
+   cap->nonleaf.sched_wfq_packet_mode_supported = 0;
+   cap->nonleaf.sched_wfq_byte_mode_supported = 0;
cap->nonleaf.stats_mask = 0;
 
return 0;
@@ -776,6 +786,8 @@ i40e_level_capabilities_get(struct rte_eth_dev *dev,
cap->leaf.shaper_private_rate_min = 0;
/* 40Gbps -> 5GBps */
cap->leaf.shaper_private_rate_max = 50ull;
+   cap->leaf.shaper_private_packet_mode_supported = 0;
+   cap->leaf.shaper_private_byte_mode_supported = 1;
cap->leaf.shaper_shared_n_max = 0;
cap->leaf.cman_head_drop_supported = false;
cap->leaf.cman_wred_context_private_supported = true;
@@ -817,6 +829,8 @@ i40e_node_capabilities_get(struct rte_eth_dev *dev,
cap->shaper_private_rate_min = 0;
/* 40Gbps -> 5GBps */
cap->shaper_private_rate_max = 50ull;
+   cap->shaper_private_packet_mode_supported = 0;
+   cap->shaper_private_byte_mode_supported = 1;
cap->shaper_shared_n_max = 0;
 
if (node_type == I40E_TM_NODE_TYPE_QUEUE) {
@@ -834,6 +848,8 @@ i40e_node_capabilities_get(struct rte_eth_dev *dev,
cap->nonleaf.sched_wfq_n_children_per_group_max = 0;
cap->nonleaf.sched_wfq_n_groups_max = 0;
cap->nonleaf.sched_wfq_weight_max = 1;
+   cap->nonleaf.sched_wfq_packet_mode_supported = 0;
+   cap->nonleaf.sched_wfq_byte_mode_supported = 0;
}
 
cap->stats_mask = 0;
diff --git a/drivers/net/ipn3ke/ipn3ke_tm.c b/drivers/net/ipn3ke/ipn3ke_tm.c
index 5a16c5f..35c90b8 100644
--- a/drivers/net/ipn3ke/ipn3ke_tm.c
+++ b/drivers/net/ipn3ke/ipn3ke_tm.c
@@ -440,6 +440,8 @@ ipn3ke_tm_capabilities_get(__rte_unused struct rte_eth_dev 
*dev,
cap->shaper_private_dual_rate_n_max = 0;
cap->shaper_private_rate_min = 1;
cap->shaper_private_rate_max = 1 + IPN3KE_TM_VT_NODE_NUM;
+   cap->shaper_private_packet_mode_supported = 0;
+   cap->shaper_private_byte_mode_supported = 1;
 
cap->shaper_shared_n_max = 0;

[dpdk-dev] [PATCH v2 3/4] app/testpmd: add tm cmd for non leaf and shaper pktmode

2020-04-11 Thread Nithin Dabilpuram
From: Nithin Dabilpuram 

Add TM command to enable packet mode for all SP children
in non leaf node. This is a new command as
"add tm nonleaf node pktmode".

Also add support to shaper profile add command to take
packet mode parameter used to setup shaper in packet mode.
This adds an extra argument "packet_mode" to shaper profile add command
"add port tm node shaper profile" as last argument.

This patch also dumps new tm port/level/node capabilities
sched_wfq_packet_mode_supported, sched_wfq_byte_mode_supported,
shaper_private_packet_mode_supported, shaper_private_byte_mode_supported,
shaper_shared_packet_mode_supported, shaper_shared_byte_mode_supported.

Signed-off-by: Nithin Dabilpuram 
---
v1..v2:
- Update tm capability show cmd to dump lastest pktmode/bytemode fields of v2.
- Update existing shaper profile add command to take last argument as pkt_mode
and update struct rte_tm_shaper_params:packet_mode with the same.
- Update documentation with latest command changes.

 app/test-pmd/cmdline.c  |   9 +-
 app/test-pmd/cmdline_tm.c   | 206 
 app/test-pmd/cmdline_tm.h   |   1 +
 doc/guides/testpmd_app_ug/testpmd_funcs.rst |  40 +-
 4 files changed, 250 insertions(+), 6 deletions(-)

diff --git a/app/test-pmd/cmdline.c b/app/test-pmd/cmdline.c
index 863b567..af90242 100644
--- a/app/test-pmd/cmdline.c
+++ b/app/test-pmd/cmdline.c
@@ -1189,7 +1189,7 @@ static void cmd_help_long_parsed(void *parsed_result,
 
"add port tm node shaper profile (port_id) 
(shaper_profile_id)"
" (cmit_tb_rate) (cmit_tb_size) (peak_tb_rate) 
(peak_tb_size)"
-   " (packet_length_adjust)\n"
+   " (packet_length_adjust) (packet_mode)\n"
"   Add port tm node private shaper profile.\n\n"
 
"del port tm node shaper profile (port_id) 
(shaper_profile_id)\n"
@@ -1221,6 +1221,12 @@ static void cmd_help_long_parsed(void *parsed_result,
" [(shared_shaper_id_0) (shared_shaper_id_1)...]\n"
"   Add port tm nonleaf node.\n\n"
 
+   "add port tm nonleaf node pktmode (port_id) (node_id) 
(parent_node_id)"
+   " (priority) (weight) (level_id) (shaper_profile_id)"
+   " (n_sp_priorities) (stats_mask) (n_shared_shapers)"
+   " [(shared_shaper_id_0) (shared_shaper_id_1)...]\n"
+   "   Add port tm nonleaf node with pkt mode 
enabled.\n\n"
+
"add port tm leaf node (port_id) (node_id) 
(parent_node_id)"
" (priority) (weight) (level_id) (shaper_profile_id)"
" (cman_mode) (wred_profile_id) (stats_mask) 
(n_shared_shapers)"
@@ -19636,6 +19642,7 @@ cmdline_parse_ctx_t main_ctx[] = {
(cmdline_parse_inst_t *)&cmd_del_port_tm_node_wred_profile,
(cmdline_parse_inst_t *)&cmd_set_port_tm_node_shaper_profile,
(cmdline_parse_inst_t *)&cmd_add_port_tm_nonleaf_node,
+   (cmdline_parse_inst_t *)&cmd_add_port_tm_nonleaf_node_pmode,
(cmdline_parse_inst_t *)&cmd_add_port_tm_leaf_node,
(cmdline_parse_inst_t *)&cmd_del_port_tm_node,
(cmdline_parse_inst_t *)&cmd_set_port_tm_node_parent,
diff --git a/app/test-pmd/cmdline_tm.c b/app/test-pmd/cmdline_tm.c
index d62a4f5..c9a2813 100644
--- a/app/test-pmd/cmdline_tm.c
+++ b/app/test-pmd/cmdline_tm.c
@@ -257,6 +257,10 @@ static void cmd_show_port_tm_cap_parsed(void 
*parsed_result,
cap.shaper_private_rate_min);
printf("cap.shaper_private_rate_max %" PRIu64 "\n",
cap.shaper_private_rate_max);
+   printf("cap.shaper_private_packet_mode_supported %" PRId32 "\n",
+   cap.shaper_private_packet_mode_supported);
+   printf("cap.shaper_private_byte_mode_supported %" PRId32 "\n",
+   cap.shaper_private_byte_mode_supported);
printf("cap.shaper_shared_n_max %" PRIu32 "\n",
cap.shaper_shared_n_max);
printf("cap.shaper_shared_n_nodes_per_shaper_max %" PRIu32 "\n",
@@ -269,6 +273,10 @@ static void cmd_show_port_tm_cap_parsed(void 
*parsed_result,
cap.shaper_shared_rate_min);
printf("cap.shaper_shared_rate_max %" PRIu64 "\n",
cap.shaper_shared_rate_max);
+   printf("cap.shaper_shared_packet_mode_supported %" PRId32 "\n",
+   cap.shaper_shared_packet_mode_supported);
+   printf("cap.shaper_shared_byte_mode_supported %" PRId32 "\n",
+   cap.shaper_shared_byte_mode_supported);
printf("cap.shaper_pkt_length_adjust_min %" PRId32 "\n",
cap.shaper_pkt_length_adjust_min);
printf("cap.shaper_pkt_length_adjust_max %" PRId32 "\n",
@@ -283,6 +291,10 @@ static void cmd_show_port_tm_cap_parsed(void 
*parsed_result,
cap.sched_wfq_n_groups_max);
 

[dpdk-dev] [PATCH v2 4/4] net/octeontx2: support tm length adjust and pkt mode

2020-04-11 Thread Nithin Dabilpuram
From: Nithin Dabilpuram 

This patch adds support to packet length adjust TM feature
for private shaper. It also adds support to packet mode
feature that applies both to private shaper and node DWRR
scheduling of SP children.

Signed-off-by: Nithin Dabilpuram 
---
v1..v2:
- Newly included patch.

 drivers/net/octeontx2/otx2_tm.c | 140 +---
 drivers/net/octeontx2/otx2_tm.h |   5 ++
 2 files changed, 122 insertions(+), 23 deletions(-)

diff --git a/drivers/net/octeontx2/otx2_tm.c b/drivers/net/octeontx2/otx2_tm.c
index f94618d..fa7d21b 100644
--- a/drivers/net/octeontx2/otx2_tm.c
+++ b/drivers/net/octeontx2/otx2_tm.c
@@ -336,18 +336,25 @@ prepare_tm_shaper_reg(struct otx2_nix_tm_node *tm_node,
 {
struct shaper_params cir, pir;
uint32_t schq = tm_node->hw_id;
+   uint64_t adjust = 0;
uint8_t k = 0;
 
memset(&cir, 0, sizeof(cir));
memset(&pir, 0, sizeof(pir));
shaper_config_to_nix(profile, &cir, &pir);
 
-   otx2_tm_dbg("Shaper config node %s(%u) lvl %u id %u, "
-   "pir %" PRIu64 "(%" PRIu64 "B),"
-" cir %" PRIu64 "(%" PRIu64 "B) (%p)",
-nix_hwlvl2str(tm_node->hw_lvl), schq, tm_node->lvl,
-tm_node->id, pir.rate, pir.burst,
-cir.rate, cir.burst, tm_node);
+   /* Packet length adjust */
+   if (tm_node->pkt_mode)
+   adjust = 1;
+   else if (profile)
+   adjust = profile->params.pkt_length_adjust & 0x1FF;
+
+   otx2_tm_dbg("Shaper config node %s(%u) lvl %u id %u, pir %" PRIu64
+   "(%" PRIu64 "B), cir %" PRIu64 "(%" PRIu64 "B)"
+   "adjust 0x%" PRIx64 "(pktmode %u) (%p)",
+   nix_hwlvl2str(tm_node->hw_lvl), schq, tm_node->lvl,
+   tm_node->id, pir.rate, pir.burst, cir.rate, cir.burst,
+   adjust, tm_node->pkt_mode, tm_node);
 
switch (tm_node->hw_lvl) {
case NIX_TXSCH_LVL_SMQ:
@@ -364,7 +371,9 @@ prepare_tm_shaper_reg(struct otx2_nix_tm_node *tm_node,
 
/* Configure RED ALG */
reg[k] = NIX_AF_MDQX_SHAPE(schq);
-   regval[k] = ((uint64_t)tm_node->red_algo << 9);
+   regval[k] = (adjust |
+(uint64_t)tm_node->red_algo << 9 |
+(uint64_t)tm_node->pkt_mode << 24);
k++;
break;
case NIX_TXSCH_LVL_TL4:
@@ -381,7 +390,9 @@ prepare_tm_shaper_reg(struct otx2_nix_tm_node *tm_node,
 
/* Configure RED algo */
reg[k] = NIX_AF_TL4X_SHAPE(schq);
-   regval[k] = ((uint64_t)tm_node->red_algo << 9);
+   regval[k] = (adjust |
+(uint64_t)tm_node->red_algo << 9 |
+(uint64_t)tm_node->pkt_mode << 24);
k++;
break;
case NIX_TXSCH_LVL_TL3:
@@ -398,7 +409,9 @@ prepare_tm_shaper_reg(struct otx2_nix_tm_node *tm_node,
 
/* Configure RED algo */
reg[k] = NIX_AF_TL3X_SHAPE(schq);
-   regval[k] = ((uint64_t)tm_node->red_algo << 9);
+   regval[k] = (adjust |
+(uint64_t)tm_node->red_algo << 9 |
+(uint64_t)tm_node->pkt_mode << 24);
k++;
 
break;
@@ -416,7 +429,9 @@ prepare_tm_shaper_reg(struct otx2_nix_tm_node *tm_node,
 
/* Configure RED algo */
reg[k] = NIX_AF_TL2X_SHAPE(schq);
-   regval[k] = ((uint64_t)tm_node->red_algo << 9);
+   regval[k] = (adjust |
+(uint64_t)tm_node->red_algo << 9 |
+(uint64_t)tm_node->pkt_mode << 24);
k++;
 
break;
@@ -426,6 +441,12 @@ prepare_tm_shaper_reg(struct otx2_nix_tm_node *tm_node,
regval[k] = (cir.rate && cir.burst) ?
(shaper2regval(&cir) | 1) : 0;
k++;
+
+   /* Configure length disable and adjust */
+   reg[k] = NIX_AF_TL1X_SHAPE(schq);
+   regval[k] = (adjust |
+(uint64_t)tm_node->pkt_mode << 24);
+   k++;
break;
}
 
@@ -773,6 +794,15 @@ nix_tm_node_add_to_list(struct otx2_eth_dev *dev, uint32_t 
node_id,
tm_node->flags = 0;
if (user)
tm_node->flags = NIX_TM_NODE_USER;
+
+   /* Packet mode */
+   if (!nix_tm_is_leaf(dev, lvl) &&
+   ((profile && profile->params.packet_mode) ||
+(params->nonleaf.wfq_weight_mode &&
+ params->nonleaf.n_sp_priorities &&
+ !params->nonleaf.wfq_weight_mode[0])))
+   tm_node->pkt_mode = 1;
+
rte_memcpy(&tm_node->params, params, sizeof(struct rte_tm_node_params));
 
if (profile)
@@ -1873,8 +1903,10 @@ otx2_nix_tm_cap

[dpdk-dev] [PATCH v5 00/29] graph: introduce graph subsystem

2020-04-11 Thread jerinj
From: Jerin Jacob 

Using graph traversal for packet processing is a proven architecture
that has been implemented in various open source libraries.

Graph architecture for packet processing enables abstracting the data
processing functions as “nodes” and “links” them together to create a
complex “graph” to create reusable/modular data processing functions. 

The patchset further includes performance enhancements and modularity
to the DPDK as discussed in more detail below.

v5..v4:
--
Addressed the following review comments from Andrzej Ostruszka.

1) Addressed and comment in 
(http://mails.dpdk.org/archives/dev/2020-April/162184.html)
and improved following function prototypes/return types and adjusted the
implementation
a) rte_graph_node_get
b) rte_graph_max_count
c) rte_graph_export
d) rte_graph_destroy
2) Updated UT and l3fwd-graph for updated function prototype
3) bug fix in edge_update
4) avoid reading graph_src_nodes_count() twice in rte_graph_create()
5) Fix graph_mem_fixup_secondray typo
6) Fixed Doxygen comments for rte_node_next_stream_put
7) Updated the documentation to reflect the same.
8) Removed RTE prefix from rte_node_mbuf_priv[1|2] * as they are
internal defines
9) Limited next_hop id provided to LPM route add in
librte_node/ip4_lookup.c to 24 bits ()
10) Fixed pattern array overflow issue with l3fwd-graph/main.c by
splitting pattern
array to default + non-default array. Updated doc with the same info.
11) Fixed parsing issues in parse_config() in l3fwd-graph/main.c inline
with issues reported
in l2fwd-event
12)Removed next_hop field in l3fwd-graph/main.c main()
13) Fixed graph create error check in l3fwd-graph/main.c main()

v4..v3:
---
Addressed the following review comments from Wang, Xiao W

1) Remove unnecessary line from rte_graph.h
2) Fix a typo from rte_graph.h
3) Move NODE_ID_CHECK to 3rd patch where it is first used.
4) Fixed bug in edge_update()

v3..v2:
---
1) refactor ipv4 node lookup by moving SSE and NEON specific code to
lib/librte_node/ip4_lookup_sse.h and lib/librte_node/ip4_lookup_neon.h
2) Add scalar version of process() function for ipv4 lookup to make
the node work on NON x86 and arm64 machines.

v2..v1:
--
1) Added programmer guide/implementation documentation and l3fwd-graph doc

RFC..v1:


1) Split the patch to more logical ones for review.
2) Added doxygen comments for the API
3) Code cleanup
4) Additional performance improvements.
Delta between l3fwd and l3fwd-graph is negligible now.
(~1%) on octeontx2.
5) Added SIMD routines for x86 in additional to arm64.

Hosted in netlify for easy reference:

Programmer’s Guide:
https://dpdk-graph.netlify.com/doc/html/guides/prog_guide/graph_lib.html

l3fwd-graph doc:
https://dpdk-graph.netlify.com/doc/html/guides/sample_app_ug/l3_forward_graph.html

API doc:
https://dpdk-graph.netlify.com/doc/html/api/rte__graph_8h.html
https://dpdk-graph.netlify.com/doc/html/api/rte__graph__worker_8h.html
https://dpdk-graph.netlify.com/doc/html/api/rte__node__eth__api_8h.html
https://dpdk-graph.netlify.com/doc/html/api/rte__node__ip4__api_8h.html

2) Added the release notes for the this feature

3) Fix build issues reported by CI for v1:
http://mails.dpdk.org/archives/test-report/2020-March/121326.html


Addional nodes planned for v20.08
--
1) Packet classification node
2) Support for IPV6 LPM node


This patchset contains
-
1) The API definition to "create" nodes and "link" together to create a
"graph" for packet processing. See, lib/librte_graph/rte_graph.h  

2) The Fast path API definition for the graph walker and enqueue
function used by the workers. See, lib/librte_graph/rte_graph_worker.h

3) Optimized SW implementation for (1) and (2). See, lib/librte_graph/

4) Test case to verify the graph infrastructure functionality
See, app/test/test_graph.c
 
5) Performance test cases to evaluate the cost of graph walker and nodes
enqueue fast-path function for various combinations.

See app/test/test_graph_perf.c

6) Packet processing nodes(Null, Rx, Tx, Pkt drop, IPV4 rewrite, IPv4
lookup)
using graph infrastructure. See lib/librte_node/*

7) An example application to showcase l3fwd
(functionality same as existing examples/l3fwd) using graph
infrastructure and use packets processing nodes (item (6)). See 
examples/l3fwd-graph/.

Performance
---
1) Graph walk and node enqueue overhead can be tested with performance
test case application [1]
# If all packets go from a node to another node (we call it as
# "homerun") then it will be just a pointer swap for a burst of packets.
# In the worst case, a couple of handful cycles to move an object from a
node to another node.

2) Performance comparison with existing l3fwd (The complete static code
with out any nodes) vs modular l3fwd-graph with 5 nodes
(ip4_lookup, ip4_rewrite, ethdev_tx, ethdev_rx, pkt_drop).
Here is graphical representation of the l3fwd-graph as Graphviz

[dpdk-dev] [PATCH v5 02/29] graph: implement node registration

2020-04-11 Thread jerinj
From: Jerin Jacob 

Adding rte_node_register() API implementation includes allocating
memory for node object, check for duplicate node name and
add the allocated node to STAILQ node_list for future use.

Signed-off-by: Jerin Jacob 
Signed-off-by: Kiran Kumar K 
Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Nithin Dabilpuram 
---
 lib/librte_graph/Makefile  |   1 +
 lib/librte_graph/graph.c   |  18 +++-
 lib/librte_graph/graph_private.h   |  75 
 lib/librte_graph/meson.build   |   2 +-
 lib/librte_graph/node.c| 113 +
 lib/librte_graph/rte_graph_version.map |   4 +
 6 files changed, 211 insertions(+), 2 deletions(-)
 create mode 100644 lib/librte_graph/graph_private.h
 create mode 100644 lib/librte_graph/node.c

diff --git a/lib/librte_graph/Makefile b/lib/librte_graph/Makefile
index 26fe514f3..933d0ee49 100644
--- a/lib/librte_graph/Makefile
+++ b/lib/librte_graph/Makefile
@@ -14,6 +14,7 @@ LDLIBS += -lrte_eal
 EXPORT_MAP := rte_graph_version.map
 
 # all source are stored in SRCS-y
+SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += node.c
 SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += graph.c
 
 # install header files
diff --git a/lib/librte_graph/graph.c b/lib/librte_graph/graph.c
index a55bf443a..a9c124896 100644
--- a/lib/librte_graph/graph.c
+++ b/lib/librte_graph/graph.c
@@ -2,4 +2,20 @@
  * Copyright(C) 2020 Marvell International Ltd.
  */
 
-#include "rte_graph.h"
+#include 
+
+#include "graph_private.h"
+
+static rte_spinlock_t graph_lock = RTE_SPINLOCK_INITIALIZER;
+
+void
+graph_spinlock_lock(void)
+{
+   rte_spinlock_lock(&graph_lock);
+}
+
+void
+graph_spinlock_unlock(void)
+{
+   rte_spinlock_unlock(&graph_lock);
+}
diff --git a/lib/librte_graph/graph_private.h b/lib/librte_graph/graph_private.h
new file mode 100644
index 0..8b9ff5292
--- /dev/null
+++ b/lib/librte_graph/graph_private.h
@@ -0,0 +1,75 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(C) 2020 Marvell International Ltd.
+ */
+
+#ifndef _RTE_GRAPH_PRIVATE_H_
+#define _RTE_GRAPH_PRIVATE_H_
+
+#include 
+#include 
+
+#include 
+#include 
+
+#include "rte_graph.h"
+
+/**
+ * @internal
+ *
+ * Structure that holds node internal data.
+ */
+struct node {
+   STAILQ_ENTRY(node) next;  /**< Next node in the list. */
+   char name[RTE_NODE_NAMESIZE]; /**< Name of the node. */
+   uint64_t flags;   /**< Node configuration flag. */
+   rte_node_process_t process;   /**< Node process function. */
+   rte_node_init_t init; /**< Node init function. */
+   rte_node_fini_t fini; /**< Node fini function. */
+   rte_node_t id;/**< Allocated identifier for the node. */
+   rte_node_t parent_id; /**< Parent node identifier. */
+   rte_edge_t nb_edges;  /**< Number of edges from this node. */
+   char next_nodes[][RTE_NODE_NAMESIZE]; /**< Names of next nodes. */
+};
+
+/* Node functions */
+STAILQ_HEAD(node_head, node);
+
+/**
+ * @internal
+ *
+ * Get the head of the node list.
+ *
+ * @return
+ *   Pointer to the node head.
+ */
+struct node_head *node_list_head_get(void);
+
+/**
+ * @internal
+ *
+ * Get node pointer from node name.
+ *
+ * @param name
+ *   Pointer to character string containing the node name.
+ *
+ * @return
+ *   Pointer to the node.
+ */
+struct node *node_from_name(const char *name);
+
+/* Lock functions */
+/**
+ * @internal
+ *
+ * Take a lock on the graph internal spin lock.
+ */
+void graph_spinlock_lock(void);
+
+/**
+ * @internal
+ *
+ * Release a lock on the graph internal spin lock.
+ */
+void graph_spinlock_unlock(void);
+
+#endif /* _RTE_GRAPH_PRIVATE_H_ */
diff --git a/lib/librte_graph/meson.build b/lib/librte_graph/meson.build
index 455cf2ba5..5754ac23b 100644
--- a/lib/librte_graph/meson.build
+++ b/lib/librte_graph/meson.build
@@ -4,7 +4,7 @@
 
 name = 'graph'
 
-sources = files('graph.c')
+sources = files('node.c', 'graph.c')
 headers = files('rte_graph.h')
 allow_experimental_apis = true
 
diff --git a/lib/librte_graph/node.c b/lib/librte_graph/node.c
new file mode 100644
index 0..336cd1c94
--- /dev/null
+++ b/lib/librte_graph/node.c
@@ -0,0 +1,113 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(C) 2020 Marvell International Ltd.
+ */
+
+#include 
+#include 
+#include 
+
+#include 
+#include 
+#include 
+#include 
+#include 
+
+#include "graph_private.h"
+
+static struct node_head node_list = STAILQ_HEAD_INITIALIZER(node_list);
+static rte_node_t node_id;
+
+/* Private functions */
+struct node_head *
+node_list_head_get(void)
+{
+   return &node_list;
+}
+
+struct node *
+node_from_name(const char *name)
+{
+   struct node *node;
+
+   STAILQ_FOREACH(node, &node_list, next)
+   if (strncmp(node->name, name, RTE_NODE_NAMESIZE) == 0)
+   return node;
+
+   return NULL;
+}
+
+static bool
+node_has_duplicate_entry(const char *name)
+{
+   struct node 

[dpdk-dev] [PATCH v5 01/29] graph: define the public API for graph support

2020-04-11 Thread jerinj
From: Jerin Jacob 

Graph architecture abstracts the data processing functions as
"node" and "link" them together to create a complex "graph" to enable
reusable/modular data processing functions.

These APIs enables graph framework operations such as create, lookup,
dump and destroy on graph and node operations such as clone,
edge update, and edge shrink, etc. The API also allows creating the
stats cluster to monitor per graph and per node stats.

This patch defines the public API for graph support.
This patch also adds support for the build infrastructure and
update the MAINTAINERS file for the graph subsystem.

Signed-off-by: Jerin Jacob 
Signed-off-by: Kiran Kumar K 
Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Nithin Dabilpuram 
---
 MAINTAINERS|   5 +
 config/common_base |   7 +
 config/rte_config.h|   4 +
 doc/api/doxy-api-index.md  |   1 +
 doc/api/doxy-api.conf.in   |   1 +
 lib/Makefile   |   3 +
 lib/librte_graph/Makefile  |  22 +
 lib/librte_graph/graph.c   |   5 +
 lib/librte_graph/meson.build   |  11 +
 lib/librte_graph/rte_graph.h   | 668 +
 lib/librte_graph/rte_graph_version.map |   3 +
 lib/meson.build|   2 +-
 mk/rte.app.mk  |   1 +
 13 files changed, 732 insertions(+), 1 deletion(-)
 create mode 100644 lib/librte_graph/Makefile
 create mode 100644 lib/librte_graph/graph.c
 create mode 100644 lib/librte_graph/meson.build
 create mode 100644 lib/librte_graph/rte_graph.h
 create mode 100644 lib/librte_graph/rte_graph_version.map

diff --git a/MAINTAINERS b/MAINTAINERS
index 4800f6884..aa40cc92b 100644
--- a/MAINTAINERS
+++ b/MAINTAINERS
@@ -1462,6 +1462,11 @@ F: examples/bpf/
 F: app/test/test_bpf.c
 F: doc/guides/prog_guide/bpf_lib.rst
 
+Graph - EXPERIMENTAL
+M: Jerin Jacob 
+M: Kiran Kumar K 
+F: lib/librte_graph/
+
 
 Test Applications
 -
diff --git a/config/common_base b/config/common_base
index c31175f9d..32f982136 100644
--- a/config/common_base
+++ b/config/common_base
@@ -1074,6 +1074,13 @@ CONFIG_RTE_LIBRTE_BPF_ELF=n
 #
 CONFIG_RTE_LIBRTE_IPSEC=y
 
+#
+# Compile librte_graph
+#
+CONFIG_RTE_LIBRTE_GRAPH=y
+CONFIG_RTE_GRAPH_BURST_SIZE=256
+CONFIG_RTE_LIBRTE_GRAPH_STATS=y
+
 #
 # Compile the test application
 #
diff --git a/config/rte_config.h b/config/rte_config.h
index d30786bc0..e9201fd46 100644
--- a/config/rte_config.h
+++ b/config/rte_config.h
@@ -98,6 +98,10 @@
 /* KNI defines */
 #define RTE_KNI_PREEMPT_DEFAULT 1
 
+/* rte_graph defines */
+#define RTE_GRAPH_BURST_SIZE 256
+#define RTE_LIBRTE_GRAPH_STATS 1
+
 /** driver defines /
 
 /* QuickAssist device */
diff --git a/doc/api/doxy-api-index.md b/doc/api/doxy-api-index.md
index dff496be0..5cc50f750 100644
--- a/doc/api/doxy-api-index.md
+++ b/doc/api/doxy-api-index.md
@@ -159,6 +159,7 @@ The public API headers are grouped by topics:
   * [pipeline] (@ref rte_pipeline.h)
 [port_in_action]   (@ref rte_port_in_action.h)
 [table_action] (@ref rte_table_action.h)
+  * [graph](@ref rte_graph.h):
 
 - **basic**:
   [approx fraction](@ref rte_approx.h),
diff --git a/doc/api/doxy-api.conf.in b/doc/api/doxy-api.conf.in
index 65e8146be..e3b7f54f8 100644
--- a/doc/api/doxy-api.conf.in
+++ b/doc/api/doxy-api.conf.in
@@ -33,6 +33,7 @@ INPUT   = @TOPDIR@/doc/api/doxy-api-index.md \
   @TOPDIR@/lib/librte_eventdev \
   @TOPDIR@/lib/librte_fib \
   @TOPDIR@/lib/librte_flow_classify \
+  @TOPDIR@/lib/librte_graph \
   @TOPDIR@/lib/librte_gro \
   @TOPDIR@/lib/librte_gso \
   @TOPDIR@/lib/librte_hash \
diff --git a/lib/Makefile b/lib/Makefile
index 46b91ae1a..1f572b659 100644
--- a/lib/Makefile
+++ b/lib/Makefile
@@ -119,6 +119,9 @@ DEPDIRS-librte_telemetry := librte_eal librte_metrics 
librte_ethdev
 DIRS-$(CONFIG_RTE_LIBRTE_RCU) += librte_rcu
 DEPDIRS-librte_rcu := librte_eal
 
+DIRS-$(CONFIG_RTE_LIBRTE_GRAPH) += librte_graph
+DEPDIRS-librte_graph := librte_eal
+
 ifeq ($(CONFIG_RTE_EXEC_ENV_LINUX),y)
 DIRS-$(CONFIG_RTE_LIBRTE_KNI) += librte_kni
 endif
diff --git a/lib/librte_graph/Makefile b/lib/librte_graph/Makefile
new file mode 100644
index 0..26fe514f3
--- /dev/null
+++ b/lib/librte_graph/Makefile
@@ -0,0 +1,22 @@
+# SPDX-License-Identifier: BSD-3-Clause
+# Copyright(C) 2020 Marvell International Ltd.
+#
+
+include $(RTE_SDK)/mk/rte.vars.mk
+
+# library name
+LIB = librte_graph.a
+
+CFLAGS += -O3 -DALLOW_EXPERIMENTAL_API
+CFLAGS += $(WERROR_FLAGS)
+LDLIBS += -lrte_eal
+
+EXPORT_MAP := rte_graph_version.map
+
+# all source are stored in SRCS-y
+SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += graph.c
+
+# install header files
+SYMLINK-$(CONFIG_RTE_LIBRTE_GRAPH)-include += rte

[dpdk-dev] [PATCH v5 03/29] graph: implement node operations

2020-04-11 Thread jerinj
From: Jerin Jacob 

Adding node-specific API implementation like cloning node, updating
edges for the node, shrinking edges of a node, retrieving edges of a
node.

Signed-off-by: Jerin Jacob 
Signed-off-by: Kiran Kumar K 
Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Nithin Dabilpuram 
---
 lib/librte_graph/graph_private.h   |  10 +
 lib/librte_graph/node.c| 271 +
 lib/librte_graph/rte_graph_version.map |  10 +
 3 files changed, 291 insertions(+)

diff --git a/lib/librte_graph/graph_private.h b/lib/librte_graph/graph_private.h
index 8b9ff5292..7ed6d01b6 100644
--- a/lib/librte_graph/graph_private.h
+++ b/lib/librte_graph/graph_private.h
@@ -13,6 +13,16 @@
 
 #include "rte_graph.h"
 
+
+#define ID_CHECK(id, id_max)   
\
+   do {   \
+   if ((id) >= (id_max)) {\
+   rte_errno = EINVAL;\
+   goto fail; \
+   }  \
+   } while (0)
+
+
 /**
  * @internal
  *
diff --git a/lib/librte_graph/node.c b/lib/librte_graph/node.c
index 336cd1c94..392e534a9 100644
--- a/lib/librte_graph/node.c
+++ b/lib/librte_graph/node.c
@@ -17,6 +17,8 @@
 static struct node_head node_list = STAILQ_HEAD_INITIALIZER(node_list);
 static rte_node_t node_id;
 
+#define NODE_ID_CHECK(id) ID_CHECK(id, node_id)
+
 /* Private functions */
 struct node_head *
 node_list_head_get(void)
@@ -111,3 +113,272 @@ __rte_node_register(const struct rte_node_register *reg)
return RTE_NODE_ID_INVALID;
 }
 
+static int
+clone_name(struct rte_node_register *reg, struct node *node, const char *name)
+{
+   ssize_t sz, rc;
+
+#define SZ RTE_NODE_NAMESIZE
+   rc = rte_strscpy(reg->name, node->name, SZ);
+   if (rc < 0)
+   goto fail;
+   sz = rc;
+   rc = rte_strscpy(reg->name + sz, "-", RTE_MAX((int16_t)(SZ - sz), 0));
+   if (rc < 0)
+   goto fail;
+   sz += rc;
+   sz = rte_strscpy(reg->name + sz, name, RTE_MAX((int16_t)(SZ - sz), 0));
+   if (sz < 0)
+   goto fail;
+
+   return 0;
+fail:
+   rte_errno = E2BIG;
+   return -rte_errno;
+}
+
+static rte_node_t
+node_clone(struct node *node, const char *name)
+{
+   rte_node_t rc = RTE_NODE_ID_INVALID;
+   struct rte_node_register *reg;
+   rte_edge_t i;
+
+   /* Don't allow to clone a node from a cloned node */
+   if (node->parent_id != RTE_NODE_ID_INVALID) {
+   rte_errno = EEXIST;
+   goto fail;
+   }
+
+   /* Check for duplicate name */
+   if (node_has_duplicate_entry(name))
+   goto fail;
+
+   reg = calloc(1, sizeof(*reg) + (sizeof(char *) * node->nb_edges));
+   if (reg == NULL) {
+   rte_errno = ENOMEM;
+   goto fail;
+   }
+
+   /* Clone the source node */
+   reg->flags = node->flags;
+   reg->process = node->process;
+   reg->init = node->init;
+   reg->fini = node->fini;
+   reg->nb_edges = node->nb_edges;
+   reg->parent_id = node->id;
+
+   for (i = 0; i < node->nb_edges; i++)
+   reg->next_nodes[i] = node->next_nodes[i];
+
+   /* Naming ceremony of the new node. name is node->name + "-" + name */
+   if (clone_name(reg, node, name))
+   goto free;
+
+   rc = __rte_node_register(reg);
+free:
+   free(reg);
+fail:
+   return rc;
+}
+
+rte_node_t
+rte_node_clone(rte_node_t id, const char *name)
+{
+   struct node *node;
+
+   NODE_ID_CHECK(id);
+   STAILQ_FOREACH(node, &node_list, next)
+   if (node->id == id)
+   return node_clone(node, name);
+
+fail:
+   return RTE_NODE_ID_INVALID;
+}
+
+rte_node_t
+rte_node_from_name(const char *name)
+{
+   struct node *node;
+
+   STAILQ_FOREACH(node, &node_list, next)
+   if (strncmp(node->name, name, RTE_NODE_NAMESIZE) == 0)
+   return node->id;
+
+   return RTE_NODE_ID_INVALID;
+}
+
+char *
+rte_node_id_to_name(rte_node_t id)
+{
+   struct node *node;
+
+   NODE_ID_CHECK(id);
+   STAILQ_FOREACH(node, &node_list, next)
+   if (node->id == id)
+   return node->name;
+
+fail:
+   return NULL;
+}
+
+rte_edge_t
+rte_node_edge_count(rte_node_t id)
+{
+   struct node *node;
+
+   NODE_ID_CHECK(id);
+   STAILQ_FOREACH(node, &node_list, next)
+   if (node->id == id)
+   return node->nb_edges;
+fail:
+   return RTE_EDGE_ID_INVALID;
+}
+
+static rte_edge_t
+edge_update(struct node *node, struct node *prev, rte_edge_t from,
+   const char **next_nodes, rte_edge_t nb_edges)
+{
+   rte_edge_t i, max_edges, c

[dpdk-dev] [PATCH v5 04/29] graph: implement node debug routines

2020-04-11 Thread jerinj
From: Jerin Jacob 

Adding node debug API implementation support to dump
single or all the node objects to the given file.

Signed-off-by: Jerin Jacob 
Signed-off-by: Kiran Kumar K 
Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Nithin Dabilpuram 
---
 lib/librte_graph/Makefile  |  1 +
 lib/librte_graph/graph_debug.c | 25 
 lib/librte_graph/graph_private.h   | 12 ++
 lib/librte_graph/meson.build   |  2 +-
 lib/librte_graph/node.c| 32 ++
 lib/librte_graph/rte_graph_version.map |  1 +
 6 files changed, 72 insertions(+), 1 deletion(-)
 create mode 100644 lib/librte_graph/graph_debug.c

diff --git a/lib/librte_graph/Makefile b/lib/librte_graph/Makefile
index 933d0ee49..2a6d86933 100644
--- a/lib/librte_graph/Makefile
+++ b/lib/librte_graph/Makefile
@@ -16,6 +16,7 @@ EXPORT_MAP := rte_graph_version.map
 # all source are stored in SRCS-y
 SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += node.c
 SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += graph.c
+SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += graph_debug.c
 
 # install header files
 SYMLINK-$(CONFIG_RTE_LIBRTE_GRAPH)-include += rte_graph.h
diff --git a/lib/librte_graph/graph_debug.c b/lib/librte_graph/graph_debug.c
new file mode 100644
index 0..75238e7ca
--- /dev/null
+++ b/lib/librte_graph/graph_debug.c
@@ -0,0 +1,25 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(C) 2020 Marvell International Ltd.
+ */
+
+#include 
+#include 
+
+#include "graph_private.h"
+
+void
+node_dump(FILE *f, struct node *n)
+{
+   rte_edge_t i;
+
+   fprintf(f, "node <%s>\n", n->name);
+   fprintf(f, "  id=%" PRIu32 "\n", n->id);
+   fprintf(f, "  flags=0x%" PRIx64 "\n", n->flags);
+   fprintf(f, "  addr=%p\n", n);
+   fprintf(f, "  process=%p\n", n->process);
+   fprintf(f, "  nb_edges=%d\n", n->nb_edges);
+
+   for (i = 0; i < n->nb_edges; i++)
+   fprintf(f, " edge[%d] <%s>\n", i, n->next_nodes[i]);
+}
+
diff --git a/lib/librte_graph/graph_private.h b/lib/librte_graph/graph_private.h
index 7ed6d01b6..6db04cee7 100644
--- a/lib/librte_graph/graph_private.h
+++ b/lib/librte_graph/graph_private.h
@@ -82,4 +82,16 @@ void graph_spinlock_lock(void);
  */
 void graph_spinlock_unlock(void);
 
+/**
+ * @internal
+ *
+ * Dump internal node object data.
+ *
+ * @param f
+ *   FILE pointer to dump the info.
+ * @param g
+ *   Pointer to the internal node object.
+ */
+void node_dump(FILE *f, struct node *n);
+
 #endif /* _RTE_GRAPH_PRIVATE_H_ */
diff --git a/lib/librte_graph/meson.build b/lib/librte_graph/meson.build
index 5754ac23b..01512182f 100644
--- a/lib/librte_graph/meson.build
+++ b/lib/librte_graph/meson.build
@@ -4,7 +4,7 @@
 
 name = 'graph'
 
-sources = files('node.c', 'graph.c')
+sources = files('node.c', 'graph.c', 'graph_debug.c')
 headers = files('rte_graph.h')
 allow_experimental_apis = true
 
diff --git a/lib/librte_graph/node.c b/lib/librte_graph/node.c
index 392e534a9..0652d40c2 100644
--- a/lib/librte_graph/node.c
+++ b/lib/librte_graph/node.c
@@ -377,6 +377,38 @@ rte_node_edge_get(rte_node_t id, char *next_nodes[])
return rc;
 }
 
+static void
+node_scan_dump(FILE *f, rte_node_t id, bool all)
+{
+   struct node *node;
+
+   RTE_ASSERT(f != NULL);
+   NODE_ID_CHECK(id);
+
+   STAILQ_FOREACH(node, &node_list, next) {
+   if (all == true) {
+   node_dump(f, node);
+   } else if (node->id == id) {
+   node_dump(f, node);
+   return;
+   }
+   }
+fail:
+   return;
+}
+
+void
+rte_node_dump(FILE *f, rte_node_t id)
+{
+   node_scan_dump(f, id, false);
+}
+
+void
+rte_node_list_dump(FILE *f)
+{
+   node_scan_dump(f, 0, true);
+}
+
 rte_node_t
 rte_node_max_count(void)
 {
diff --git a/lib/librte_graph/rte_graph_version.map 
b/lib/librte_graph/rte_graph_version.map
index 412386356..f2c2139c5 100644
--- a/lib/librte_graph/rte_graph_version.map
+++ b/lib/librte_graph/rte_graph_version.map
@@ -4,6 +4,7 @@ EXPERIMENTAL {
__rte_node_register;
 
rte_node_clone;
+   rte_node_dump;
rte_node_edge_count;
rte_node_edge_get;
rte_node_edge_shrink;
-- 
2.25.1



[dpdk-dev] [PATCH v5 06/29] graph: populate fastpath memory for graph reel

2020-04-11 Thread jerinj
From: Jerin Jacob 

Adding support to create and populate the memory for graph reel.
This includes reserving the memory in the memzone, populating the nodes,
Allocating memory for node-specific streams to hold objects.

Once it is populated the reel memory contains the following sections.

+-+
|   Graph Header  |
+-+
|   Fence |
+-+
|   Circular buffer   |
+-+
|   Fence |
+-+
|   Node Object 0 |
+--- -+
|   Node Object 1 |
+--- -+
|   Node Object 2 |
+--- -+
|   Node Object n |
+--- -+

Signed-off-by: Jerin Jacob 
Signed-off-by: Kiran Kumar K 
Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Nithin Dabilpuram 
---
 lib/librte_graph/Makefile  |   2 +
 lib/librte_graph/graph.c   |  16 ++
 lib/librte_graph/graph_populate.c  | 234 +
 lib/librte_graph/graph_private.h   |  64 +++
 lib/librte_graph/meson.build   |   4 +-
 lib/librte_graph/node.c|   5 +
 lib/librte_graph/rte_graph_version.map |   1 +
 lib/librte_graph/rte_graph_worker.h| 106 +++
 8 files changed, 430 insertions(+), 2 deletions(-)
 create mode 100644 lib/librte_graph/graph_populate.c
 create mode 100644 lib/librte_graph/rte_graph_worker.h

diff --git a/lib/librte_graph/Makefile b/lib/librte_graph/Makefile
index 39ecb2652..7bfd7d51f 100644
--- a/lib/librte_graph/Makefile
+++ b/lib/librte_graph/Makefile
@@ -18,8 +18,10 @@ SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += node.c
 SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += graph.c
 SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += graph_ops.c
 SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += graph_debug.c
+SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += graph_populate.c
 
 # install header files
 SYMLINK-$(CONFIG_RTE_LIBRTE_GRAPH)-include += rte_graph.h
+SYMLINK-$(CONFIG_RTE_LIBRTE_GRAPH)-include += rte_graph_worker.h
 
 include $(RTE_SDK)/mk/rte.lib.mk
diff --git a/lib/librte_graph/graph.c b/lib/librte_graph/graph.c
index 4c3f2fe7b..e1930b7d2 100644
--- a/lib/librte_graph/graph.c
+++ b/lib/librte_graph/graph.c
@@ -2,6 +2,7 @@
  * Copyright(C) 2020 Marvell International Ltd.
  */
 
+#include 
 #include 
 
 #include "graph_private.h"
@@ -19,3 +20,18 @@ graph_spinlock_unlock(void)
 {
rte_spinlock_unlock(&graph_lock);
 }
+
+void __rte_noinline
+__rte_node_stream_alloc(struct rte_graph *graph, struct rte_node *node)
+{
+   uint16_t size = node->size;
+
+   RTE_VERIFY(size != UINT16_MAX);
+   /* Allocate double amount of size to avoid immediate realloc */
+   size = RTE_MIN(UINT16_MAX, RTE_MAX(RTE_GRAPH_BURST_SIZE, size * 2));
+   node->objs = rte_realloc_socket(node->objs, size * sizeof(void *),
+   RTE_CACHE_LINE_SIZE, graph->socket);
+   RTE_VERIFY(node->objs);
+   node->size = size;
+   node->realloc_count++;
+}
diff --git a/lib/librte_graph/graph_populate.c 
b/lib/librte_graph/graph_populate.c
new file mode 100644
index 0..093512efa
--- /dev/null
+++ b/lib/librte_graph/graph_populate.c
@@ -0,0 +1,234 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(C) 2020 Marvell International Ltd.
+ */
+
+#include 
+#include 
+
+#include 
+#include 
+#include 
+#include 
+
+#include "graph_private.h"
+
+static size_t
+graph_fp_mem_calc_size(struct graph *graph)
+{
+   struct graph_node *graph_node;
+   rte_node_t val;
+   size_t sz;
+
+   /* Graph header */
+   sz = sizeof(struct rte_graph);
+   /* Source nodes list */
+   sz += sizeof(rte_graph_off_t) * graph->src_node_count;
+   /* Circular buffer for pending streams of size number of nodes */
+   val = rte_align32pow2(graph->node_count * sizeof(rte_graph_off_t));
+   sz = RTE_ALIGN(sz, val);
+   graph->cir_start = sz;
+   graph->cir_mask = rte_align32pow2(graph->node_count) - 1;
+   sz += val;
+   /* Fence */
+   sz += sizeof(RTE_GRAPH_FENCE);
+   sz = RTE_ALIGN(sz, RTE_CACHE_LINE_SIZE);
+   graph->nodes_start = sz;
+   /* For 0..N node objects with fence */
+   STAILQ_FOREACH(graph_node, &graph->node_list, next) {
+   sz = RTE_ALIGN(sz, RTE_CACHE_LINE_SIZE);
+   sz += sizeof(struct rte_node);
+   /* Pointer to next nodes(edges) */
+   sz += sizeof(struct rte_node *) * graph_node->node->nb_edges;
+   }
+
+   graph->mem_sz = sz;
+   return sz;
+}
+
+static void
+graph_header_popluate(struct graph *_graph)
+{
+   struct rte_graph *graph = _graph->graph;
+
+   graph->tail = 0;
+   graph->head = (int32_t)-_graph->src_node_count;
+   graph->cir_mask = _graph->cir_mask;
+   graph->nb_nodes = _graph->node_count;
+   graph->cir_start = RTE_PTR_ADD(graph, _graph->cir_start);
+   graph->nodes_start = _graph->nodes_start;
+   graph->socket = _graph->socket;
+   graph->id = _graph->

[dpdk-dev] [PATCH v5 11/29] graph: implement stats support

2020-04-11 Thread jerinj
From: Jerin Jacob 

Adding implementation for graph stats collection API. This API will
create a cluster for a specified node pattern and aggregate the node
runtime stats.

Signed-off-by: Jerin Jacob 
Signed-off-by: Kiran Kumar K 
Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Nithin Dabilpuram 
---
 lib/librte_graph/Makefile  |   1 +
 lib/librte_graph/graph_stats.c | 406 +
 lib/librte_graph/meson.build   |   2 +-
 lib/librte_graph/rte_graph_version.map |   5 +
 4 files changed, 413 insertions(+), 1 deletion(-)
 create mode 100644 lib/librte_graph/graph_stats.c

diff --git a/lib/librte_graph/Makefile b/lib/librte_graph/Makefile
index 7bfd7d51f..967c8d9bc 100644
--- a/lib/librte_graph/Makefile
+++ b/lib/librte_graph/Makefile
@@ -18,6 +18,7 @@ SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += node.c
 SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += graph.c
 SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += graph_ops.c
 SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += graph_debug.c
+SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += graph_stats.c
 SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += graph_populate.c
 
 # install header files
diff --git a/lib/librte_graph/graph_stats.c b/lib/librte_graph/graph_stats.c
new file mode 100644
index 0..125e08d73
--- /dev/null
+++ b/lib/librte_graph/graph_stats.c
@@ -0,0 +1,406 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(C) 2020 Marvell International Ltd.
+ */
+
+#include 
+#include 
+
+#include 
+#include 
+#include 
+
+#include "graph_private.h"
+
+/* Capture all graphs of cluster */
+struct cluster {
+   rte_graph_t nb_graphs;
+   rte_graph_t size;
+
+   struct graph **graphs;
+};
+
+/* Capture same node ID across cluster  */
+struct cluster_node {
+   struct rte_graph_cluster_node_stats stat;
+   rte_node_t nb_nodes;
+
+   struct rte_node *nodes[];
+};
+
+struct rte_graph_cluster_stats {
+   /* Header */
+   rte_graph_cluster_stats_cb_t fn;
+   uint32_t cluster_node_size; /* Size of struct cluster_node */
+   rte_node_t max_nodes;
+   int socket_id;
+   void *cookie;
+   size_t sz;
+
+   struct cluster_node clusters[];
+} __rte_cache_aligned;
+
+#define boarder()  
\
+   fprintf(f, "+---+---+" \
+  "---+---+---+---+-" \
+  "--+\n")
+
+static inline void
+print_banner(FILE *f)
+{
+   boarder();
+   fprintf(f, "%-32s%-16s%-16s%-16s%-16s%-16s%-16s\n", "|Node", "|calls",
+   "|objs", "|realloc_count", "|objs/call", "|objs/sec(10E6)",
+   "|cycles/call|");
+   boarder();
+}
+
+static inline void
+print_node(FILE *f, const struct rte_graph_cluster_node_stats *stat)
+{
+   double objs_per_call, objs_per_sec, cycles_per_call, ts_per_hz;
+   const uint64_t prev_calls = stat->prev_calls;
+   const uint64_t prev_objs = stat->prev_objs;
+   const uint64_t cycles = stat->cycles;
+   const uint64_t calls = stat->calls;
+   const uint64_t objs = stat->objs;
+   uint64_t call_delta;
+
+   call_delta = calls - prev_calls;
+   objs_per_call =
+   call_delta ? (double)((objs - prev_objs) / call_delta) : 0;
+   cycles_per_call =
+   call_delta ? (double)((cycles - stat->prev_cycles) / call_delta)
+  : 0;
+   ts_per_hz = (double)((stat->ts - stat->prev_ts) / stat->hz);
+   objs_per_sec = ts_per_hz ? (objs - prev_objs) / ts_per_hz : 0;
+   objs_per_sec /= 100;
+
+   fprintf(f,
+   "|%-31s|%-15" PRIu64 "|%-15" PRIu64 "|%-15" PRIu64
+   "|%-15.3f|%-15.6f|%-11.4f|\n",
+   stat->name, calls, objs, stat->realloc_count, objs_per_call,
+   objs_per_sec, cycles_per_call);
+}
+
+static int
+graph_cluster_stats_cb(bool is_first, bool is_last, void *cookie,
+  const struct rte_graph_cluster_node_stats *stat)
+{
+   FILE *f = cookie;
+
+   if (unlikely(is_first))
+   print_banner(f);
+   if (stat->objs)
+   print_node(f, stat);
+   if (unlikely(is_last))
+   boarder();
+
+   return 0;
+};
+
+static struct rte_graph_cluster_stats *
+stats_mem_init(struct cluster *cluster,
+  const struct rte_graph_cluster_stats_param *prm)
+{
+   size_t sz = sizeof(struct rte_graph_cluster_stats);
+   struct rte_graph_cluster_stats *stats;
+   rte_graph_cluster_stats_cb_t fn;
+   int socket_id = prm->socket_id;
+   uint32_t cluster_node_size;
+
+   /* Fix up callback */
+   fn = prm->fn;
+   if (fn == NULL)
+   fn = graph_cluster_stats_cb;
+
+   cluster_node_size = sizeof(struct cluster_node);
+   /* For a given cluster, max nodes will be the max number of graphs */
+   cluster_node_size += cluster->nb_graphs * sizeof(struct rte_node *);
+   cluster_nod

[dpdk-dev] [PATCH v5 07/29] graph: implement create and destroy APIs

2020-04-11 Thread jerinj
From: Jerin Jacob 

Adding graph specific API implementations like graph create
and graph destroy. This detect loops in the graph,
check for isolated nodes and operation to verify the validity of
graph.

Signed-off-by: Jerin Jacob 
Signed-off-by: Kiran Kumar K 
Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Nithin Dabilpuram 
---
 lib/librte_graph/graph.c   | 319 +
 lib/librte_graph/rte_graph_version.map |   2 +
 2 files changed, 321 insertions(+)

diff --git a/lib/librte_graph/graph.c b/lib/librte_graph/graph.c
index e1930b7d2..f4e02fdfc 100644
--- a/lib/librte_graph/graph.c
+++ b/lib/librte_graph/graph.c
@@ -2,13 +2,33 @@
  * Copyright(C) 2020 Marvell International Ltd.
  */
 
+#include 
+#include 
+
+#include 
+#include 
+#include 
 #include 
+#include 
 #include 
+#include 
 
 #include "graph_private.h"
 
+static struct graph_head graph_list = STAILQ_HEAD_INITIALIZER(graph_list);
 static rte_spinlock_t graph_lock = RTE_SPINLOCK_INITIALIZER;
+static rte_graph_t graph_id;
 int rte_graph_logtype;
+
+#define GRAPH_ID_CHECK(id) ID_CHECK(id, graph_id)
+
+/* Private functions */
+struct graph_head *
+graph_list_head_get(void)
+{
+   return &graph_list;
+}
+
 void
 graph_spinlock_lock(void)
 {
@@ -21,6 +41,305 @@ graph_spinlock_unlock(void)
rte_spinlock_unlock(&graph_lock);
 }
 
+static int
+graph_node_add(struct graph *graph, struct node *node)
+{
+   struct graph_node *graph_node;
+   size_t sz;
+
+   /* Skip the duplicate nodes */
+   STAILQ_FOREACH(graph_node, &graph->node_list, next)
+   if (strncmp(node->name, graph_node->node->name,
+   RTE_NODE_NAMESIZE) == 0)
+   return 0;
+
+   /* Allocate new graph node object */
+   sz = sizeof(*graph_node) + node->nb_edges * sizeof(struct node *);
+   graph_node = calloc(1, sz);
+
+   if (graph_node == NULL)
+   SET_ERR_JMP(ENOMEM, free, "Failed to calloc %s object",
+   node->name);
+
+   /* Initialize the graph node */
+   graph_node->node = node;
+
+   /* Add to graph node list */
+   STAILQ_INSERT_TAIL(&graph->node_list, graph_node, next);
+   return 0;
+
+free:
+   free(graph_node);
+   return -rte_errno;
+}
+
+static struct graph_node *
+node_to_graph_node(struct graph *graph, struct node *node)
+{
+   struct graph_node *graph_node;
+
+   STAILQ_FOREACH(graph_node, &graph->node_list, next)
+   if (graph_node->node == node)
+   return graph_node;
+
+   SET_ERR_JMP(ENODEV, fail, "Found isolated node %s", node->name);
+fail:
+   return NULL;
+}
+
+static int
+graph_node_edges_add(struct graph *graph)
+{
+   struct graph_node *graph_node;
+   struct node *adjacency;
+   const char *next;
+   rte_edge_t i;
+
+   STAILQ_FOREACH(graph_node, &graph->node_list, next) {
+   for (i = 0; i < graph_node->node->nb_edges; i++) {
+   next = graph_node->node->next_nodes[i];
+   adjacency = node_from_name(next);
+   if (adjacency == NULL)
+   SET_ERR_JMP(EINVAL, fail,
+   "Node %s not registered", next);
+   if (graph_node_add(graph, adjacency))
+   goto fail;
+   }
+   }
+   return 0;
+fail:
+   return -rte_errno;
+}
+
+static int
+graph_adjacency_list_update(struct graph *graph)
+{
+   struct graph_node *graph_node, *tmp;
+   struct node *adjacency;
+   const char *next;
+   rte_edge_t i;
+
+   STAILQ_FOREACH(graph_node, &graph->node_list, next) {
+   for (i = 0; i < graph_node->node->nb_edges; i++) {
+   next = graph_node->node->next_nodes[i];
+   adjacency = node_from_name(next);
+   if (adjacency == NULL)
+   SET_ERR_JMP(EINVAL, fail,
+   "Node %s not registered", next);
+   tmp = node_to_graph_node(graph, adjacency);
+   if (tmp == NULL)
+   goto fail;
+   graph_node->adjacency_list[i] = tmp;
+   }
+   }
+
+   return 0;
+fail:
+   return -rte_errno;
+}
+
+static int
+expand_pattern_to_node(struct graph *graph, const char *pattern)
+{
+   struct node_head *node_head = node_list_head_get();
+   bool found = false;
+   struct node *node;
+
+   /* Check for pattern match */
+   STAILQ_FOREACH(node, node_head, next) {
+   if (fnmatch(pattern, node->name, 0) == 0) {
+   if (graph_node_add(graph, node))
+   goto fail;
+   found = true;
+   }
+   }
+   if (found == false)
+   SET_ERR_JMP(EFAULT, fail, "Pattern 

[dpdk-dev] [PATCH v5 08/29] graph: implement graph operation APIs

2020-04-11 Thread jerinj
From: Jerin Jacob 

Adding support for graph specific API implementation like
Graph lookup to get graph object, retrieving graph ID
>From name and graph name from ID.

Signed-off-by: Jerin Jacob 
Signed-off-by: Kiran Kumar K 
Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Nithin Dabilpuram 
---
 lib/librte_graph/graph.c   | 131 +
 lib/librte_graph/rte_graph_version.map |   8 ++
 2 files changed, 139 insertions(+)

diff --git a/lib/librte_graph/graph.c b/lib/librte_graph/graph.c
index f4e02fdfc..7a77cb5c8 100644
--- a/lib/librte_graph/graph.c
+++ b/lib/librte_graph/graph.c
@@ -210,6 +210,54 @@ graph_node_fini(struct graph *graph)
   graph_node->node->name));
 }
 
+static struct rte_graph *
+graph_mem_fixup_node_ctx(struct rte_graph *graph)
+{
+   struct rte_node *node;
+   struct node *node_db;
+   rte_graph_off_t off;
+   rte_node_t count;
+   const char *name;
+
+   rte_graph_foreach_node(count, off, graph, node) {
+   if (node->parent_id == RTE_NODE_ID_INVALID) /* Static node */
+   name = node->name;
+   else /* Cloned node */
+   name = node->parent;
+
+   node_db = node_from_name(name);
+   if (node_db == NULL)
+   SET_ERR_JMP(ENOLINK, fail, "Node %s not found", name);
+   node->process = node_db->process;
+   }
+
+   return graph;
+fail:
+   return NULL;
+}
+
+static struct rte_graph *
+graph_mem_fixup_secondary(struct rte_graph *graph)
+{
+   if (graph == NULL || rte_eal_process_type() == RTE_PROC_PRIMARY)
+   return graph;
+
+   return graph_mem_fixup_node_ctx(graph);
+}
+
+struct rte_graph *
+rte_graph_lookup(const char *name)
+{
+   const struct rte_memzone *mz;
+   struct rte_graph *rc = NULL;
+
+   mz = rte_memzone_lookup(name);
+   if (mz)
+   rc = mz->addr;
+
+   return graph_mem_fixup_secondary(rc);
+}
+
 rte_graph_t
 rte_graph_create(const char *name, struct rte_graph_param *prm)
 {
@@ -340,6 +388,76 @@ rte_graph_destroy(rte_graph_t id)
return rc;
 }
 
+rte_graph_t
+rte_graph_from_name(const char *name)
+{
+   struct graph *graph;
+
+   STAILQ_FOREACH(graph, &graph_list, next)
+   if (strncmp(graph->name, name, RTE_GRAPH_NAMESIZE) == 0)
+   return graph->id;
+
+   return RTE_GRAPH_ID_INVALID;
+}
+
+char *
+rte_graph_id_to_name(rte_graph_t id)
+{
+   struct graph *graph;
+
+   GRAPH_ID_CHECK(id);
+   STAILQ_FOREACH(graph, &graph_list, next)
+   if (graph->id == id)
+   return graph->name;
+
+fail:
+   return NULL;
+}
+
+struct rte_node *
+rte_graph_node_get(rte_graph_t gid, uint32_t nid)
+{
+   struct rte_node *node;
+   struct graph *graph;
+   rte_graph_off_t off;
+   rte_node_t count;
+
+   GRAPH_ID_CHECK(gid);
+   STAILQ_FOREACH(graph, &graph_list, next)
+   if (graph->id == gid) {
+   rte_graph_foreach_node(count, off, graph->graph,
+   node) {
+   if (node->id == nid)
+   return node;
+   }
+   break;
+   }
+fail:
+   return NULL;
+}
+
+struct rte_node *
+rte_graph_node_get_by_name(const char *graph_name, const char *node_name)
+{
+   struct rte_node *node;
+   struct graph *graph;
+   rte_graph_off_t off;
+   rte_node_t count;
+
+   STAILQ_FOREACH(graph, &graph_list, next)
+   if (!strncmp(graph->name, graph_name, RTE_GRAPH_NAMESIZE)) {
+   rte_graph_foreach_node(count, off, graph->graph,
+   node) {
+   if (!strncmp(node->name, node_name,
+RTE_NODE_NAMESIZE))
+   return node;
+   }
+   break;
+   }
+
+   return NULL;
+}
+
 void __rte_noinline
 __rte_node_stream_alloc(struct rte_graph *graph, struct rte_node *node)
 {
@@ -354,3 +472,16 @@ __rte_node_stream_alloc(struct rte_graph *graph, struct 
rte_node *node)
node->size = size;
node->realloc_count++;
 }
+
+rte_graph_t
+rte_graph_max_count(void)
+{
+   return graph_id;
+}
+
+RTE_INIT(rte_graph_init_log)
+{
+   rte_graph_logtype = rte_log_register("lib.graph");
+   if (rte_graph_logtype >= 0)
+   rte_log_set_level(rte_graph_logtype, RTE_LOG_INFO);
+}
diff --git a/lib/librte_graph/rte_graph_version.map 
b/lib/librte_graph/rte_graph_version.map
index dcbd78c02..5a2b13293 100644
--- a/lib/librte_graph/rte_graph_version.map
+++ b/lib/librte_graph/rte_graph_version.map
@@ -6,6 +6,14 @@ EXPERIMENTAL {
 
rte_graph_create;
rte_gr

[dpdk-dev] [PATCH v5 05/29] graph: implement internal graph operation helpers

2020-04-11 Thread jerinj
From: Jerin Jacob 

Adding internal graph API helpers support to check whether a graph has
isolated nodes and any node have a loop to itself and BFS
algorithm implementation etc.

Signed-off-by: Jerin Jacob 
Signed-off-by: Nithin Dabilpuram 
---
 lib/librte_graph/Makefile|   1 +
 lib/librte_graph/graph.c |   2 +-
 lib/librte_graph/graph_ops.c | 169 ++
 lib/librte_graph/graph_private.h | 173 +++
 lib/librte_graph/meson.build |   2 +-
 5 files changed, 345 insertions(+), 2 deletions(-)
 create mode 100644 lib/librte_graph/graph_ops.c

diff --git a/lib/librte_graph/Makefile b/lib/librte_graph/Makefile
index 2a6d86933..39ecb2652 100644
--- a/lib/librte_graph/Makefile
+++ b/lib/librte_graph/Makefile
@@ -16,6 +16,7 @@ EXPORT_MAP := rte_graph_version.map
 # all source are stored in SRCS-y
 SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += node.c
 SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += graph.c
+SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += graph_ops.c
 SRCS-$(CONFIG_RTE_LIBRTE_GRAPH) += graph_debug.c
 
 # install header files
diff --git a/lib/librte_graph/graph.c b/lib/librte_graph/graph.c
index a9c124896..4c3f2fe7b 100644
--- a/lib/librte_graph/graph.c
+++ b/lib/librte_graph/graph.c
@@ -7,7 +7,7 @@
 #include "graph_private.h"
 
 static rte_spinlock_t graph_lock = RTE_SPINLOCK_INITIALIZER;
-
+int rte_graph_logtype;
 void
 graph_spinlock_lock(void)
 {
diff --git a/lib/librte_graph/graph_ops.c b/lib/librte_graph/graph_ops.c
new file mode 100644
index 0..335595311
--- /dev/null
+++ b/lib/librte_graph/graph_ops.c
@@ -0,0 +1,169 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(C) 2020 Marvell International Ltd.
+ */
+
+#include 
+#include 
+
+#include 
+#include 
+
+#include "graph_private.h"
+
+/* Check whether a node has next_node to itself */
+static inline int
+node_has_loop_edge(struct node *node)
+{
+   rte_edge_t i;
+   char *name;
+   int rc = 0;
+
+   for (i = 0; i < node->nb_edges; i++) {
+   if (strncmp(node->name, node->next_nodes[i],
+   RTE_NODE_NAMESIZE) == 0) {
+   name = node->name;
+   rc = 1;
+   SET_ERR_JMP(EINVAL, fail, "Node %s has loop to self",
+   name);
+   }
+   }
+fail:
+   return rc;
+}
+
+int
+graph_node_has_loop_edge(struct graph *graph)
+{
+   struct graph_node *graph_node;
+
+   STAILQ_FOREACH(graph_node, &graph->node_list, next)
+   if (node_has_loop_edge(graph_node->node))
+   return 1;
+
+   return 0;
+}
+
+rte_node_t
+graph_src_nodes_count(struct graph *graph)
+{
+   struct graph_node *graph_node;
+   rte_node_t rc = 0;
+
+   STAILQ_FOREACH(graph_node, &graph->node_list, next)
+   if (graph_node->node->flags & RTE_NODE_SOURCE_F)
+   rc++;
+
+   if (rc == 0)
+   SET_ERR_JMP(EINVAL, fail, "Graph needs at least a source node");
+fail:
+   return rc;
+}
+
+/* Check whether a node has next_node to a source node */
+int
+graph_node_has_edge_to_src_node(struct graph *graph)
+{
+   struct graph_node *graph_node;
+   struct node *node;
+   rte_edge_t i;
+
+   STAILQ_FOREACH(graph_node, &graph->node_list, next) {
+   for (i = 0; i < graph_node->node->nb_edges; i++) {
+   node = graph_node->adjacency_list[i]->node;
+   if (node->flags & RTE_NODE_SOURCE_F)
+   SET_ERR_JMP(
+   EEXIST, fail,
+   "Node %s points to the source node %s",
+   graph_node->node->name, node->name);
+   }
+   }
+
+   return 0;
+fail:
+   return 1;
+}
+
+rte_node_t
+graph_nodes_count(struct graph *graph)
+{
+   struct graph_node *graph_node;
+   rte_node_t count = 0;
+
+   STAILQ_FOREACH(graph_node, &graph->node_list, next)
+   count++;
+
+   return count;
+}
+
+void
+graph_mark_nodes_as_not_visited(struct graph *graph)
+{
+   struct graph_node *graph_node;
+
+   STAILQ_FOREACH(graph_node, &graph->node_list, next)
+   graph_node->visited = false;
+}
+
+int
+graph_bfs(struct graph *graph, struct graph_node *start)
+{
+   struct graph_node **queue, *v, *tmp;
+   uint16_t head = 0, tail = 0;
+   rte_edge_t i;
+   size_t sz;
+
+   sz = sizeof(struct graph_node *) * graph_nodes_count(graph);
+   queue = malloc(sz);
+   if (queue == NULL)
+   SET_ERR_JMP(ENOMEM, fail, "Failed to alloc BFS queue of %zu",
+   sz);
+
+   /* BFS algorithm */
+   queue[tail++] = start;
+   start->visited = true;
+   while (head != tail) {
+   v = queue[head++];
+   for (i = 0; i < v->node->nb_edges; i++) {
+   tmp = v->adj

[dpdk-dev] [PATCH v5 09/29] graph: implement Graphviz export

2020-04-11 Thread jerinj
From: Jerin Jacob 

Adding API implementation support exporting the graph object to file.
This will export the graph to a file in Graphviz format.
It can be viewed in many viewers such as
https://dreampuf.github.io/GraphvizOnline/

Signed-off-by: Jerin Jacob 
Signed-off-by: Kiran Kumar K 
Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Nithin Dabilpuram 
---
 lib/librte_graph/graph.c   | 53 ++
 lib/librte_graph/rte_graph_version.map |  1 +
 2 files changed, 54 insertions(+)

diff --git a/lib/librte_graph/graph.c b/lib/librte_graph/graph.c
index 7a77cb5c8..61e212e03 100644
--- a/lib/librte_graph/graph.c
+++ b/lib/librte_graph/graph.c
@@ -473,6 +473,59 @@ __rte_node_stream_alloc(struct rte_graph *graph, struct 
rte_node *node)
node->realloc_count++;
 }
 
+static int
+graph_to_dot(FILE *f, struct graph *graph)
+{
+   const char *src_edge_color = " [color=blue]\n";
+   const char *edge_color = "\n";
+   struct graph_node *graph_node;
+   char *node_name;
+   rte_edge_t i;
+   int rc;
+
+   rc = fprintf(f, "Digraph %s {\n\trankdir=LR;\n", graph->name);
+   if (rc < 0)
+   goto end;
+
+   STAILQ_FOREACH(graph_node, &graph->node_list, next) {
+   node_name = graph_node->node->name;
+   for (i = 0; i < graph_node->node->nb_edges; i++) {
+   rc = fprintf(f, "\t\"%s\"->\"%s\"%s", node_name,
+graph_node->adjacency_list[i]->node->name,
+graph_node->node->flags & RTE_NODE_SOURCE_F
+? src_edge_color
+: edge_color);
+   if (rc < 0)
+   goto end;
+   }
+   }
+   rc = fprintf(f, "}\n");
+   if (rc < 0)
+   goto end;
+
+   return 0;
+end:
+   rte_errno = EBADF;
+   return -rte_errno;
+}
+
+int
+rte_graph_export(const char *name, FILE *f)
+{
+   struct graph *graph;
+   int rc = ENOENT;
+
+   STAILQ_FOREACH(graph, &graph_list, next) {
+   if (strncmp(graph->name, name, RTE_GRAPH_NAMESIZE) == 0) {
+   rc = graph_to_dot(f, graph);
+   goto end;
+   }
+   }
+end:
+   return -rc;
+}
+
+
 rte_graph_t
 rte_graph_max_count(void)
 {
diff --git a/lib/librte_graph/rte_graph_version.map 
b/lib/librte_graph/rte_graph_version.map
index 5a2b13293..2797be044 100644
--- a/lib/librte_graph/rte_graph_version.map
+++ b/lib/librte_graph/rte_graph_version.map
@@ -6,6 +6,7 @@ EXPERIMENTAL {
 
rte_graph_create;
rte_graph_destroy;
+   rte_graph_export;
rte_graph_from_name;
rte_graph_id_to_name;
rte_graph_lookup;
-- 
2.25.1



[dpdk-dev] [PATCH v5 12/29] graph: implement fastpath API routines

2020-04-11 Thread jerinj
From: Jerin Jacob 

Adding implementation for rte_graph_walk() API. This will perform a walk
on the circular buffer and call the process function of each node
and collect the stats if stats collection is enabled.

Signed-off-by: Jerin Jacob 
Signed-off-by: Kiran Kumar K 
Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Nithin Dabilpuram 
---
 doc/api/doxy-api-index.md  |   1 +
 lib/librte_graph/graph.c   |  16 +
 lib/librte_graph/rte_graph_version.map |  10 +
 lib/librte_graph/rte_graph_worker.h| 404 +
 4 files changed, 431 insertions(+)

diff --git a/doc/api/doxy-api-index.md b/doc/api/doxy-api-index.md
index 5cc50f750..fd2ff64d7 100644
--- a/doc/api/doxy-api-index.md
+++ b/doc/api/doxy-api-index.md
@@ -160,6 +160,7 @@ The public API headers are grouped by topics:
 [port_in_action]   (@ref rte_port_in_action.h)
 [table_action] (@ref rte_table_action.h)
   * [graph](@ref rte_graph.h):
+[graph_worker] (@ref rte_graph_worker.h)
 
 - **basic**:
   [approx fraction](@ref rte_approx.h),
diff --git a/lib/librte_graph/graph.c b/lib/librte_graph/graph.c
index e811a7b38..0ea83df3d 100644
--- a/lib/librte_graph/graph.c
+++ b/lib/librte_graph/graph.c
@@ -473,6 +473,22 @@ __rte_node_stream_alloc(struct rte_graph *graph, struct 
rte_node *node)
node->realloc_count++;
 }
 
+void __rte_noinline
+__rte_node_stream_alloc_size(struct rte_graph *graph, struct rte_node *node,
+uint16_t req_size)
+{
+   uint16_t size = node->size;
+
+   RTE_VERIFY(size != UINT16_MAX);
+   /* Allocate double amount of size to avoid immediate realloc */
+   size = RTE_MIN(UINT16_MAX, RTE_MAX(RTE_GRAPH_BURST_SIZE, req_size * 2));
+   node->objs = rte_realloc_socket(node->objs, size * sizeof(void *),
+   RTE_CACHE_LINE_SIZE, graph->socket);
+   RTE_VERIFY(node->objs);
+   node->size = size;
+   node->realloc_count++;
+}
+
 static int
 graph_to_dot(FILE *f, struct graph *graph)
 {
diff --git a/lib/librte_graph/rte_graph_version.map 
b/lib/librte_graph/rte_graph_version.map
index adf55d406..13b838752 100644
--- a/lib/librte_graph/rte_graph_version.map
+++ b/lib/librte_graph/rte_graph_version.map
@@ -3,6 +3,7 @@ EXPERIMENTAL {
 
__rte_node_register;
__rte_node_stream_alloc;
+   __rte_node_stream_alloc_size;
 
rte_graph_create;
rte_graph_destroy;
@@ -16,6 +17,7 @@ EXPERIMENTAL {
rte_graph_node_get;
rte_graph_node_get_by_name;
rte_graph_obj_dump;
+   rte_graph_walk;
 
rte_graph_cluster_stats_create;
rte_graph_cluster_stats_destroy;
@@ -28,10 +30,18 @@ EXPERIMENTAL {
rte_node_edge_get;
rte_node_edge_shrink;
rte_node_edge_update;
+   rte_node_enqueue;
+   rte_node_enqueue_x1;
+   rte_node_enqueue_x2;
+   rte_node_enqueue_x4;
+   rte_node_enqueue_next;
rte_node_from_name;
rte_node_id_to_name;
rte_node_list_dump;
rte_node_max_count;
+   rte_node_next_stream_get;
+   rte_node_next_stream_put;
+   rte_node_next_stream_move;
 
local: *;
 };
diff --git a/lib/librte_graph/rte_graph_worker.h 
b/lib/librte_graph/rte_graph_worker.h
index 42be8fd13..4c3ddcbde 100644
--- a/lib/librte_graph/rte_graph_worker.h
+++ b/lib/librte_graph/rte_graph_worker.h
@@ -99,6 +99,410 @@ struct rte_node {
 __rte_experimental
 void __rte_node_stream_alloc(struct rte_graph *graph, struct rte_node *node);
 
+/**
+ * @internal
+ *
+ * Allocate a stream with requested number of objects.
+ *
+ * If stream already exists then re-allocate it to a larger size.
+ *
+ * @param graph
+ *   Pointer to the graph object.
+ * @param node
+ *   Pointer to the node object.
+ * @param req_size
+ *   Number of objects to be allocated.
+ */
+__rte_experimental
+void __rte_node_stream_alloc_size(struct rte_graph *graph,
+ struct rte_node *node, uint16_t req_size);
+
+/**
+ * Perform graph walk on the circular buffer and invoke the process function
+ * of the nodes and collect the stats.
+ *
+ * @param graph
+ *   Graph pointer returned from rte_graph_lookup function.
+ *
+ * @see rte_graph_lookup()
+ */
+__rte_experimental
+static inline void
+rte_graph_walk(struct rte_graph *graph)
+{
+   const rte_graph_off_t *cir_start = graph->cir_start;
+   const rte_node_t mask = graph->cir_mask;
+   uint32_t head = graph->head;
+   struct rte_node *node;
+   uint64_t start;
+   uint16_t rc;
+   void **objs;
+
+   /*
+* Walk on the source node(s) ((cir_start - head) -> cir_start) and then
+* on the pending streams (cir_start -> (cir_start + mask) -> cir_start)
+* in a circular buffer fashion.
+*
+*  +-+ <= cir_start - head [number of source nodes]
+*  | |
+*  | ... | <= source nodes
+*  | |
+*

[dpdk-dev] [PATCH v5 13/29] graph: add unit test case

2020-04-11 Thread jerinj
From: Kiran Kumar K 

Adding the unit test to test the functionality of node and graph APIs.
Testing includes registering a node, cloning a node, creating a graph,
perform graph walk, collecting stats and all node and graph debug APIs.

example command to test:
echo "graph_autotest" | sudo ./build/app/test/dpdk-test -c 0x30

Signed-off-by: Kiran Kumar K 
Signed-off-by: Nithin Dabilpuram 
---
 app/test/Makefile |   6 +
 app/test/meson.build  |   6 +-
 app/test/test_graph.c | 819 ++
 3 files changed, 830 insertions(+), 1 deletion(-)
 create mode 100644 app/test/test_graph.c

diff --git a/app/test/Makefile b/app/test/Makefile
index 1f080d162..ce2e08e12 100644
--- a/app/test/Makefile
+++ b/app/test/Makefile
@@ -221,6 +221,10 @@ SRCS-y += test_event_timer_adapter.c
 SRCS-y += test_event_crypto_adapter.c
 endif
 
+ifeq ($(CONFIG_RTE_LIBRTE_GRAPH), y)
+SRCS-y += test_graph.c
+endif
+
 ifeq ($(CONFIG_RTE_LIBRTE_RAWDEV),y)
 SRCS-y += test_rawdev.c
 endif
@@ -240,6 +244,8 @@ endif
 CFLAGS += -DALLOW_EXPERIMENTAL_API
 
 CFLAGS += -O3
+# Strict-aliasing rules are violated by uint8_t[] to context size casts.
+CFLAGS += -fno-strict-aliasing
 CFLAGS += $(WERROR_FLAGS)
 
 LDLIBS += -lm
diff --git a/app/test/meson.build b/app/test/meson.build
index 351d29cb6..3cf850584 100644
--- a/app/test/meson.build
+++ b/app/test/meson.build
@@ -51,6 +51,7 @@ test_sources = files('commands.c',
'test_fib6_perf.c',
'test_func_reentrancy.c',
'test_flow_classify.c',
+   'test_graph.c',
'test_hash.c',
'test_hash_functions.c',
'test_hash_multiwriter.c',
@@ -151,7 +152,8 @@ test_deps = ['acl',
'rib',
'ring',
'stack',
-   'timer'
+   'timer',
+   'graph'
 ]
 
 # Each test is marked with flag true/false
@@ -362,6 +364,8 @@ endif
 
 # specify -D_GNU_SOURCE unconditionally
 cflags += '-D_GNU_SOURCE'
+# Strict-aliasing rules are violated by uint8_t[] to context size casts.
+cflags += '-fno-strict-aliasing'
 
 test_dep_objs = []
 if dpdk_conf.has('RTE_LIBRTE_COMPRESSDEV')
diff --git a/app/test/test_graph.c b/app/test/test_graph.c
new file mode 100644
index 0..f5c957f82
--- /dev/null
+++ b/app/test/test_graph.c
@@ -0,0 +1,819 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(C) 2020 Marvell International Ltd.
+ */
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+
+#include 
+#include 
+#include 
+#include 
+
+#include "test.h"
+
+static uint16_t test_node_worker_source(struct rte_graph *graph,
+   struct rte_node *node, void **objs,
+   uint16_t nb_objs);
+
+static uint16_t test_node0_worker(struct rte_graph *graph,
+ struct rte_node *node, void **objs,
+ uint16_t nb_objs);
+
+static uint16_t test_node1_worker(struct rte_graph *graph,
+ struct rte_node *node, void **objs,
+ uint16_t nb_objs);
+
+static uint16_t test_node2_worker(struct rte_graph *graph,
+ struct rte_node *node, void **objs,
+ uint16_t nb_objs);
+
+static uint16_t test_node3_worker(struct rte_graph *graph,
+ struct rte_node *node, void **objs,
+ uint16_t nb_objs);
+
+#define MBUFF_SIZE 512
+#define MAX_NODES  4
+
+static struct rte_mbuf mbuf[MAX_NODES + 1][MBUFF_SIZE];
+static void *mbuf_p[MAX_NODES + 1][MBUFF_SIZE];
+static rte_graph_t graph_id;
+static uint64_t obj_stats[MAX_NODES + 1];
+static uint64_t fn_calls[MAX_NODES + 1];
+
+const char *node_patterns[] = {
+   "test_node_source1",   "test_node00",
+   "test_node00-test_node11", "test_node00-test_node22",
+   "test_node00-test_node33",
+};
+
+const char *node_names[] = {
+   "test_node00",
+   "test_node00-test_node11",
+   "test_node00-test_node22",
+   "test_node00-test_node33",
+};
+
+struct test_node_register {
+   char name[RTE_NODE_NAMESIZE];
+   rte_node_process_t process;
+   uint16_t nb_edges;
+   const char *next_nodes[MAX_NODES];
+};
+
+typedef struct {
+   uint32_t idx;
+   struct test_node_register node;
+} test_node_t;
+
+typedef struct {
+   test_node_t test_node[MAX_NODES];
+} test_main_t;
+
+static test_main_t test_main = {
+   .test_node = {
+   {
+   .node = {
+   .name = "test_node00",
+   .process = test_node0_worker,
+   .nb_edges = 2,
+   .next_nodes = {"test_node00-"
+  "test_node11",
+  "test_node00-"
+  "test_node22"},
+   

[dpdk-dev] [PATCH v5 10/29] graph: implement debug routines

2020-04-11 Thread jerinj
From: Jerin Jacob 

Adding implementation for graph specific API to dump the
Graph information to a file. This API will dump detailed internal
info about node objects and graph objects.

Signed-off-by: Jerin Jacob 
Signed-off-by: Kiran Kumar K 
Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Nithin Dabilpuram 
---
 lib/librte_graph/graph.c   | 31 ++
 lib/librte_graph/graph_debug.c | 59 ++
 lib/librte_graph/graph_private.h   | 13 ++
 lib/librte_graph/rte_graph_version.map |  2 +
 4 files changed, 105 insertions(+)

diff --git a/lib/librte_graph/graph.c b/lib/librte_graph/graph.c
index 61e212e03..e811a7b38 100644
--- a/lib/librte_graph/graph.c
+++ b/lib/librte_graph/graph.c
@@ -525,6 +525,37 @@ rte_graph_export(const char *name, FILE *f)
return -rc;
 }
 
+static void
+graph_scan_dump(FILE *f, rte_graph_t id, bool all)
+{
+   struct graph *graph;
+
+   RTE_VERIFY(f);
+   GRAPH_ID_CHECK(id);
+
+   STAILQ_FOREACH(graph, &graph_list, next) {
+   if (all == true) {
+   graph_dump(f, graph);
+   } else if (graph->id == id) {
+   graph_dump(f, graph);
+   return;
+   }
+   }
+fail:
+   return;
+}
+
+void
+rte_graph_dump(FILE *f, rte_graph_t id)
+{
+   graph_scan_dump(f, id, false);
+}
+
+void
+rte_graph_list_dump(FILE *f)
+{
+   graph_scan_dump(f, 0, true);
+}
 
 rte_graph_t
 rte_graph_max_count(void)
diff --git a/lib/librte_graph/graph_debug.c b/lib/librte_graph/graph_debug.c
index 75238e7ca..f8aea16ac 100644
--- a/lib/librte_graph/graph_debug.c
+++ b/lib/librte_graph/graph_debug.c
@@ -7,6 +7,26 @@
 
 #include "graph_private.h"
 
+void
+graph_dump(FILE *f, struct graph *g)
+{
+   struct graph_node *graph_node;
+   rte_edge_t i = 0;
+
+   fprintf(f, "graph <%s>\n", g->name);
+   fprintf(f, "  id=%" PRIu32 "\n", g->id);
+   fprintf(f, "  cir_start=%" PRIu32 "\n", g->cir_start);
+   fprintf(f, "  cir_mask=%" PRIu32 "\n", g->cir_mask);
+   fprintf(f, "  addr=%p\n", g);
+   fprintf(f, "  graph=%p\n", g->graph);
+   fprintf(f, "  mem_sz=%zu\n", g->mem_sz);
+   fprintf(f, "  node_count=%" PRIu32 "\n", g->node_count);
+   fprintf(f, "  src_node_count=%" PRIu32 "\n", g->src_node_count);
+
+   STAILQ_FOREACH(graph_node, &g->node_list, next)
+   fprintf(f, " node[%d] <%s>\n", i++, graph_node->node->name);
+}
+
 void
 node_dump(FILE *f, struct node *n)
 {
@@ -23,3 +43,42 @@ node_dump(FILE *f, struct node *n)
fprintf(f, " edge[%d] <%s>\n", i, n->next_nodes[i]);
 }
 
+void
+rte_graph_obj_dump(FILE *f, struct rte_graph *g, bool all)
+{
+   rte_node_t count;
+   rte_graph_off_t off;
+   struct rte_node *n;
+   rte_edge_t i;
+
+   fprintf(f, "graph <%s> @ %p\n", g->name, g);
+   fprintf(f, "  id=%" PRIu32 "\n", g->id);
+   fprintf(f, "  head=%" PRId32 "\n", (int32_t)g->head);
+   fprintf(f, "  tail=%" PRId32 "\n", (int32_t)g->tail);
+   fprintf(f, "  cir_mask=0x%" PRIx32 "\n", g->cir_mask);
+   fprintf(f, "  nb_nodes=%" PRId32 "\n", g->nb_nodes);
+   fprintf(f, "  socket=%d\n", g->socket);
+   fprintf(f, "  fence=0x%" PRIx64 "\n", g->fence);
+   fprintf(f, "  nodes_start=0x%" PRIx32 "\n", g->nodes_start);
+   fprintf(f, "  cir_start=%p\n", g->cir_start);
+
+   rte_graph_foreach_node(count, off, g, n) {
+   if (!all && n->idx == 0)
+   continue;
+   fprintf(f, " node[%d] <%s>\n", count, n->name);
+   fprintf(f, "   fence=0x%" PRIx64 "\n", n->fence);
+   fprintf(f, "   objs=%p\n", n->objs);
+   fprintf(f, "   process=%p\n", n->process);
+   fprintf(f, "   id=0x%" PRIx32 "\n", n->id);
+   fprintf(f, "   offset=0x%" PRIx32 "\n", n->off);
+   fprintf(f, "   nb_edges=%" PRId32 "\n", n->nb_edges);
+   fprintf(f, "   realloc_count=%d\n", n->realloc_count);
+   fprintf(f, "   size=%d\n", n->size);
+   fprintf(f, "   idx=%d\n", n->idx);
+   fprintf(f, "   total_objs=%" PRId64 "\n", n->total_objs);
+   fprintf(f, "   total_calls=%" PRId64 "\n", n->total_calls);
+   for (i = 0; i < n->nb_edges; i++)
+   fprintf(f, "  edge[%d] <%s>\n", i,
+   n->nodes[i]->name);
+   }
+}
diff --git a/lib/librte_graph/graph_private.h b/lib/librte_graph/graph_private.h
index 7fce52e00..f9a85c892 100644
--- a/lib/librte_graph/graph_private.h
+++ b/lib/librte_graph/graph_private.h
@@ -319,6 +319,19 @@ struct rte_node *graph_node_id_to_ptr(const struct 
rte_graph *graph,
 struct rte_node *graph_node_name_to_ptr(const struct rte_graph *graph,
const char *node_name);
 
+/* Debug functions */
+/**
+ * 

[dpdk-dev] [PATCH v5 14/29] graph: add performance testcase

2020-04-11 Thread jerinj
From: Pavan Nikhilesh 

Add unit test framework to create and test performance of various graph
models.

example command to test:

echo "graph_perf_autotest" | sudo ./build/app/test/dpdk-test -c 0x30

Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Nithin Dabilpuram 
---
 app/test/Makefile  |1 +
 app/test/meson.build   |1 +
 app/test/test_graph_perf.c | 1057 
 3 files changed, 1059 insertions(+)
 create mode 100644 app/test/test_graph_perf.c

diff --git a/app/test/Makefile b/app/test/Makefile
index ce2e08e12..77276f300 100644
--- a/app/test/Makefile
+++ b/app/test/Makefile
@@ -223,6 +223,7 @@ endif
 
 ifeq ($(CONFIG_RTE_LIBRTE_GRAPH), y)
 SRCS-y += test_graph.c
+SRCS-y += test_graph_perf.c
 endif
 
 ifeq ($(CONFIG_RTE_LIBRTE_RAWDEV),y)
diff --git a/app/test/meson.build b/app/test/meson.build
index 3cf850584..9006cc074 100644
--- a/app/test/meson.build
+++ b/app/test/meson.build
@@ -52,6 +52,7 @@ test_sources = files('commands.c',
'test_func_reentrancy.c',
'test_flow_classify.c',
'test_graph.c',
+   'test_graph_perf.c',
'test_hash.c',
'test_hash_functions.c',
'test_hash_multiwriter.c',
diff --git a/app/test/test_graph_perf.c b/app/test/test_graph_perf.c
new file mode 100644
index 0..3089fb24c
--- /dev/null
+++ b/app/test/test_graph_perf.c
@@ -0,0 +1,1057 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(C) 2020 Marvell International Ltd.
+ */
+#include 
+#include 
+#include 
+#include 
+
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+
+#include "test.h"
+
+#define TEST_GRAPH_PERF_MZ  "graph_perf_data"
+#define TEST_GRAPH_SRC_NAME "test_graph_perf_source"
+#define TEST_GRAPH_SRC_BRST_ONE_NAME "test_graph_perf_source_one"
+#define TEST_GRAPH_WRK_NAME "test_graph_perf_worker"
+#define TEST_GRAPH_SNK_NAME "test_graph_perf_sink"
+
+#define SOURCES(map)RTE_DIM(map)
+#define STAGES(map) RTE_DIM(map)
+#define NODES_PER_STAGE(map) RTE_DIM(map[0])
+#define SINKS(map)  RTE_DIM(map[0])
+
+#define MAX_EDGES_PER_NODE 7
+
+struct test_node_data {
+   uint8_t node_id;
+   uint8_t is_sink;
+   uint8_t next_nodes[MAX_EDGES_PER_NODE];
+   uint8_t next_percentage[MAX_EDGES_PER_NODE];
+};
+
+struct test_graph_perf {
+   uint16_t nb_nodes;
+   rte_graph_t graph_id;
+   struct test_node_data *node_data;
+};
+
+struct graph_lcore_data {
+   uint8_t done;
+   rte_graph_t graph_id;
+};
+
+static struct test_node_data *
+graph_get_node_data(struct test_graph_perf *graph_data, rte_node_t id)
+{
+   struct test_node_data *node_data = NULL;
+   int i;
+
+   for (i = 0; i < graph_data->nb_nodes; i++)
+   if (graph_data->node_data[i].node_id == id) {
+   node_data = &graph_data->node_data[i];
+   break;
+   }
+
+   return node_data;
+}
+
+static int
+test_node_ctx_init(const struct rte_graph *graph, struct rte_node *node)
+{
+   struct test_graph_perf *graph_data;
+   struct test_node_data *node_data;
+   const struct rte_memzone *mz;
+   rte_node_t nid = node->id;
+   rte_edge_t edge = 0;
+   int i;
+
+   RTE_SET_USED(graph);
+
+   mz = rte_memzone_lookup(TEST_GRAPH_PERF_MZ);
+   graph_data = mz->addr;
+   node_data = graph_get_node_data(graph_data, nid);
+   node->ctx[0] = node->nb_edges;
+   for (i = 0; i < node->nb_edges && !node_data->is_sink; i++, edge++) {
+   node->ctx[i + 1] = edge;
+   node->ctx[i + 9] = node_data->next_percentage[i];
+   }
+
+   return 0;
+}
+
+/* Source node function */
+static uint16_t
+test_perf_node_worker_source(struct rte_graph *graph, struct rte_node *node,
+void **objs, uint16_t nb_objs)
+{
+   uint16_t count;
+   int i;
+
+   RTE_SET_USED(objs);
+   RTE_SET_USED(nb_objs);
+
+   /* Create a proportional stream for every next */
+   for (i = 0; i < node->ctx[0]; i++) {
+   count = (node->ctx[i + 9] * RTE_GRAPH_BURST_SIZE) / 100;
+   rte_node_next_stream_get(graph, node, node->ctx[i + 1], count);
+   rte_node_next_stream_put(graph, node, node->ctx[i + 1], count);
+   }
+
+   return RTE_GRAPH_BURST_SIZE;
+}
+
+static struct rte_node_register test_graph_perf_source = {
+   .name = TEST_GRAPH_SRC_NAME,
+   .process = test_perf_node_worker_source,
+   .flags = RTE_NODE_SOURCE_F,
+   .init = test_node_ctx_init,
+};
+
+RTE_NODE_REGISTER(test_graph_perf_source);
+
+static uint16_t
+test_perf_node_worker_source_burst_one(struct rte_graph *graph,
+  struct rte_node *node, void **objs,
+  uint16_t nb_objs)
+{
+   uint16_t count;
+   int i;
+
+   RTE_SET_USED(objs);
+   RTE_SET_USED(nb_objs);
+
+   /* Crea

[dpdk-dev] [PATCH v5 16/29] node: add ethdev Rx node

2020-04-11 Thread jerinj
From: Nithin Dabilpuram 

Add source rte_node ethdev_rx process function and register
it. This node is a source node that will be called periodically
and when called, performs rte_eth_rx_burst() on a specific
(port, queue) pair and enqueue them as stream of objects to
next node.

Signed-off-by: Nithin Dabilpuram 
Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Kiran Kumar K 
---
 lib/librte_node/Makefile |   3 +-
 lib/librte_node/ethdev_rx.c  | 221 +++
 lib/librte_node/ethdev_rx_priv.h |  81 +++
 lib/librte_node/meson.build  |   4 +-
 4 files changed, 306 insertions(+), 3 deletions(-)
 create mode 100644 lib/librte_node/ethdev_rx.c
 create mode 100644 lib/librte_node/ethdev_rx_priv.h

diff --git a/lib/librte_node/Makefile b/lib/librte_node/Makefile
index dbc8e1d44..314149385 100644
--- a/lib/librte_node/Makefile
+++ b/lib/librte_node/Makefile
@@ -11,12 +11,13 @@ CFLAGS += -O3 -DALLOW_EXPERIMENTAL_API
 CFLAGS += $(WERROR_FLAGS)
 # Strict-aliasing rules are violated by uint8_t[] to context size casts.
 CFLAGS += -fno-strict-aliasing
-LDLIBS += -lrte_eal -lrte_graph
+LDLIBS += -lrte_eal -lrte_graph -lrte_ethdev
 
 EXPORT_MAP := rte_node_version.map
 
 # all source are stored in SRCS-y
 SRCS-$(CONFIG_RTE_LIBRTE_NODE) += null.c
 SRCS-$(CONFIG_RTE_LIBRTE_NODE) += log.c
+SRCS-$(CONFIG_RTE_LIBRTE_NODE) += ethdev_rx.c
 
 include $(RTE_SDK)/mk/rte.lib.mk
diff --git a/lib/librte_node/ethdev_rx.c b/lib/librte_node/ethdev_rx.c
new file mode 100644
index 0..5cc736598
--- /dev/null
+++ b/lib/librte_node/ethdev_rx.c
@@ -0,0 +1,221 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(C) 2020 Marvell International Ltd.
+ */
+
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+
+#include "ethdev_rx_priv.h"
+#include "node_private.h"
+
+static struct ethdev_rx_node_main ethdev_rx_main;
+
+static __rte_always_inline uint16_t
+ethdev_rx_node_process_inline(struct rte_graph *graph, struct rte_node *node,
+ uint16_t port, uint16_t queue)
+{
+   uint16_t count, next_index = ETHDEV_RX_NEXT_IP4_LOOKUP;
+
+   /* Get pkts from port */
+   count = rte_eth_rx_burst(port, queue, (struct rte_mbuf **)node->objs,
+RTE_GRAPH_BURST_SIZE);
+
+   if (!count)
+   return 0;
+   node->idx = count;
+   /* Enqueue to next node */
+   rte_node_next_stream_move(graph, node, next_index);
+
+   return count;
+}
+
+static __rte_always_inline uint16_t
+ethdev_rx_node_process(struct rte_graph *graph, struct rte_node *node,
+  void **objs, uint16_t cnt)
+{
+   ethdev_rx_node_ctx_t *ctx = (ethdev_rx_node_ctx_t *)node->ctx;
+   uint16_t n_pkts = 0;
+
+   RTE_SET_USED(objs);
+   RTE_SET_USED(cnt);
+
+   n_pkts = ethdev_rx_node_process_inline(graph, node, ctx->port_id,
+  ctx->queue_id);
+   return n_pkts;
+}
+
+static inline uint32_t
+l3_ptype(uint16_t etype, uint32_t ptype)
+{
+   ptype = ptype & ~RTE_PTYPE_L3_MASK;
+   if (etype == rte_cpu_to_be_16(RTE_ETHER_TYPE_IPV4))
+   ptype |= RTE_PTYPE_L3_IPV4_EXT_UNKNOWN;
+   else if (etype == rte_cpu_to_be_16(RTE_ETHER_TYPE_IPV6))
+   ptype |= RTE_PTYPE_L3_IPV6_EXT_UNKNOWN;
+   return ptype;
+}
+
+/* Callback for soft ptype parsing */
+static uint16_t
+eth_pkt_parse_cb(uint16_t port, uint16_t queue, struct rte_mbuf **mbufs,
+uint16_t nb_pkts, uint16_t max_pkts, void *user_param)
+{
+   struct rte_mbuf *mbuf0, *mbuf1, *mbuf2, *mbuf3;
+   struct rte_ether_hdr *eth_hdr;
+   uint16_t etype, n_left;
+   struct rte_mbuf **pkts;
+
+   RTE_SET_USED(port);
+   RTE_SET_USED(queue);
+   RTE_SET_USED(max_pkts);
+   RTE_SET_USED(user_param);
+
+   pkts = mbufs;
+   n_left = nb_pkts;
+   while (n_left >= 12) {
+
+   /* Prefetch next-next mbufs */
+   rte_prefetch0(pkts[8]);
+   rte_prefetch0(pkts[9]);
+   rte_prefetch0(pkts[10]);
+   rte_prefetch0(pkts[11]);
+
+   /* Prefetch next mbuf data */
+   rte_prefetch0(
+   rte_pktmbuf_mtod(pkts[4], struct rte_ether_hdr *));
+   rte_prefetch0(
+   rte_pktmbuf_mtod(pkts[5], struct rte_ether_hdr *));
+   rte_prefetch0(
+   rte_pktmbuf_mtod(pkts[6], struct rte_ether_hdr *));
+   rte_prefetch0(
+   rte_pktmbuf_mtod(pkts[7], struct rte_ether_hdr *));
+
+   mbuf0 = pkts[0];
+   mbuf1 = pkts[1];
+   mbuf2 = pkts[2];
+   mbuf3 = pkts[3];
+   pkts += 4;
+   n_left -= 4;
+
+   /* Extract ptype of mbuf0 */
+   eth_hdr = rte_pktmbuf_mtod(mbuf0, struct rte_ether_hdr *);
+   etype = eth_hdr->ether_type;
+   mbuf0->packet_

[dpdk-dev] [PATCH v5 15/29] node: add log infra and null node

2020-04-11 Thread jerinj
From: Nithin Dabilpuram 

Add log infra for node specific logging.
Also, add null rte_node that just ignores all the objects
directed to it.

Signed-off-by: Nithin Dabilpuram 
Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Kiran Kumar K 
---
 MAINTAINERS  |  5 +
 app/test/meson.build |  7 +--
 config/common_base   |  5 +
 doc/api/doxy-api.conf.in |  1 +
 lib/Makefile |  3 +++
 lib/librte_node/Makefile | 22 ++
 lib/librte_node/log.c| 14 ++
 lib/librte_node/meson.build  |  8 
 lib/librte_node/node_private.h   | 22 ++
 lib/librte_node/null.c   | 23 +++
 lib/librte_node/rte_node_version.map |  6 ++
 lib/meson.build  |  5 -
 meson.build  |  1 +
 mk/rte.app.mk|  1 +
 14 files changed, 120 insertions(+), 3 deletions(-)
 create mode 100644 lib/librte_node/Makefile
 create mode 100644 lib/librte_node/log.c
 create mode 100644 lib/librte_node/meson.build
 create mode 100644 lib/librte_node/node_private.h
 create mode 100644 lib/librte_node/null.c
 create mode 100644 lib/librte_node/rte_node_version.map

diff --git a/MAINTAINERS b/MAINTAINERS
index aa40cc92b..55fb9bbb0 100644
--- a/MAINTAINERS
+++ b/MAINTAINERS
@@ -1467,6 +1467,11 @@ M: Jerin Jacob 
 M: Kiran Kumar K 
 F: lib/librte_graph/
 
+Nodes - EXPERIMENTAL
+M: Nithin Dabilpuram 
+M: Pavan Nikhilesh 
+F: lib/librte_node/
+
 
 Test Applications
 -
diff --git a/app/test/meson.build b/app/test/meson.build
index 9006cc074..728d20c1f 100644
--- a/app/test/meson.build
+++ b/app/test/meson.build
@@ -154,7 +154,8 @@ test_deps = ['acl',
'ring',
'stack',
'timer',
-   'graph'
+   'graph',
+   'node'
 ]
 
 # Each test is marked with flag true/false
@@ -390,13 +391,15 @@ endforeach
 test_dep_objs += cc.find_library('execinfo', required: false)
 
 link_libs = []
+link_nodes = []
 if get_option('default_library') == 'static'
link_libs = dpdk_drivers
+   link_nodes = dpdk_graph_nodes
 endif
 
 dpdk_test = executable('dpdk-test',
test_sources,
-   link_whole: link_libs,
+   link_whole: link_libs + link_nodes,
dependencies: test_dep_objs,
c_args: [cflags, '-DALLOW_EXPERIMENTAL_API'],
install_rpath: driver_install_path,
diff --git a/config/common_base b/config/common_base
index 32f982136..1ed5187dc 100644
--- a/config/common_base
+++ b/config/common_base
@@ -1081,6 +1081,11 @@ CONFIG_RTE_LIBRTE_GRAPH=y
 CONFIG_RTE_GRAPH_BURST_SIZE=256
 CONFIG_RTE_LIBRTE_GRAPH_STATS=y
 
+#
+# Compile librte_node
+#
+CONFIG_RTE_LIBRTE_NODE=y
+
 #
 # Compile the test application
 #
diff --git a/doc/api/doxy-api.conf.in b/doc/api/doxy-api.conf.in
index e3b7f54f8..92122125a 100644
--- a/doc/api/doxy-api.conf.in
+++ b/doc/api/doxy-api.conf.in
@@ -49,6 +49,7 @@ INPUT   = @TOPDIR@/doc/api/doxy-api-index.md \
   @TOPDIR@/lib/librte_mempool \
   @TOPDIR@/lib/librte_meter \
   @TOPDIR@/lib/librte_metrics \
+  @TOPDIR@/lib/librte_node \
   @TOPDIR@/lib/librte_net \
   @TOPDIR@/lib/librte_pci \
   @TOPDIR@/lib/librte_pdump \
diff --git a/lib/Makefile b/lib/Makefile
index 1f572b659..50d61a338 100644
--- a/lib/Makefile
+++ b/lib/Makefile
@@ -122,6 +122,9 @@ DEPDIRS-librte_rcu := librte_eal
 DIRS-$(CONFIG_RTE_LIBRTE_GRAPH) += librte_graph
 DEPDIRS-librte_graph := librte_eal
 
+DIRS-$(CONFIG_RTE_LIBRTE_NODE) += librte_node
+DEPDIRS-librte_node := librte_graph librte_lpm librte_ethdev librte_mbuf
+
 ifeq ($(CONFIG_RTE_EXEC_ENV_LINUX),y)
 DIRS-$(CONFIG_RTE_LIBRTE_KNI) += librte_kni
 endif
diff --git a/lib/librte_node/Makefile b/lib/librte_node/Makefile
new file mode 100644
index 0..dbc8e1d44
--- /dev/null
+++ b/lib/librte_node/Makefile
@@ -0,0 +1,22 @@
+# SPDX-License-Identifier: BSD-3-Clause
+# Copyright(C) 2020 Marvell International Ltd.
+#
+
+include $(RTE_SDK)/mk/rte.vars.mk
+
+# library name
+LIB = librte_node.a
+
+CFLAGS += -O3 -DALLOW_EXPERIMENTAL_API
+CFLAGS += $(WERROR_FLAGS)
+# Strict-aliasing rules are violated by uint8_t[] to context size casts.
+CFLAGS += -fno-strict-aliasing
+LDLIBS += -lrte_eal -lrte_graph
+
+EXPORT_MAP := rte_node_version.map
+
+# all source are stored in SRCS-y
+SRCS-$(CONFIG_RTE_LIBRTE_NODE) += null.c
+SRCS-$(CONFIG_RTE_LIBRTE_NODE) += log.c
+
+include $(RTE_SDK)/mk/rte.lib.mk
diff --git a/lib/librte_node/log.c b/lib/librte_node/log.c
new file mode 100644
index 0..f035f91e8
--- /dev/null
+++ b/lib/librte_node/log.c
@@ -0,0 +1,14 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(C) 2020 Marvell International Ltd.
+ */
+
+#include "node_private.h"
+
+int rte_node_logtyp

[dpdk-dev] [PATCH v5 18/29] node: add ethdev Rx and Tx node ctrl API

2020-04-11 Thread jerinj
From: Nithin Dabilpuram 

Add ctrl api to setup ethdev_rx and ethdev_tx node.
This ctrl api clones 'N' number of ethdev_rx and ethdev_tx
nodes with specific (port, queue) pairs updated in their context.
All the ethdev ports and queues are setup before this api
is called.

Signed-off-by: Nithin Dabilpuram 
Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Kiran Kumar K 
---
 doc/api/doxy-api-index.md|  2 +
 lib/librte_node/Makefile |  6 +-
 lib/librte_node/ethdev_ctrl.c| 99 
 lib/librte_node/meson.build  |  5 +-
 lib/librte_node/node_private.h   | 57 
 lib/librte_node/rte_node_eth_api.h   | 64 ++
 lib/librte_node/rte_node_version.map |  1 +
 7 files changed, 231 insertions(+), 3 deletions(-)
 create mode 100644 lib/librte_node/ethdev_ctrl.c
 create mode 100644 lib/librte_node/rte_node_eth_api.h

diff --git a/doc/api/doxy-api-index.md b/doc/api/doxy-api-index.md
index fd2ff64d7..1784674df 100644
--- a/doc/api/doxy-api-index.md
+++ b/doc/api/doxy-api-index.md
@@ -161,6 +161,8 @@ The public API headers are grouped by topics:
 [table_action] (@ref rte_table_action.h)
   * [graph](@ref rte_graph.h):
 [graph_worker] (@ref rte_graph_worker.h)
+  * graph_nodes:
+[eth_node] (@ref rte_node_eth_api.h),
 
 - **basic**:
   [approx fraction](@ref rte_approx.h),
diff --git a/lib/librte_node/Makefile b/lib/librte_node/Makefile
index 7428f6c43..ea5fa77f7 100644
--- a/lib/librte_node/Makefile
+++ b/lib/librte_node/Makefile
@@ -11,7 +11,7 @@ CFLAGS += -O3 -DALLOW_EXPERIMENTAL_API
 CFLAGS += $(WERROR_FLAGS)
 # Strict-aliasing rules are violated by uint8_t[] to context size casts.
 CFLAGS += -fno-strict-aliasing
-LDLIBS += -lrte_eal -lrte_graph -lrte_mbuf -lrte_ethdev
+LDLIBS += -lrte_eal -lrte_graph -lrte_mbuf -lrte_ethdev -lrte_mempool
 
 EXPORT_MAP := rte_node_version.map
 
@@ -20,5 +20,9 @@ SRCS-$(CONFIG_RTE_LIBRTE_NODE) += null.c
 SRCS-$(CONFIG_RTE_LIBRTE_NODE) += log.c
 SRCS-$(CONFIG_RTE_LIBRTE_NODE) += ethdev_rx.c
 SRCS-$(CONFIG_RTE_LIBRTE_NODE) += ethdev_tx.c
+SRCS-$(CONFIG_RTE_LIBRTE_NODE) += ethdev_ctrl.c
+
+# install header files
+SYMLINK-$(CONFIG_RTE_LIBRTE_NODE)-include += rte_node_eth_api.h
 
 include $(RTE_SDK)/mk/rte.lib.mk
diff --git a/lib/librte_node/ethdev_ctrl.c b/lib/librte_node/ethdev_ctrl.c
new file mode 100644
index 0..599d20b0b
--- /dev/null
+++ b/lib/librte_node/ethdev_ctrl.c
@@ -0,0 +1,99 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(C) 2020 Marvell International Ltd.
+ */
+
+#include 
+#include 
+#include 
+#include 
+
+#include "rte_node_eth_api.h"
+
+#include "ethdev_rx_priv.h"
+#include "ethdev_tx_priv.h"
+#include "node_private.h"
+
+static struct ethdev_ctrl {
+   uint16_t nb_graphs;
+} ctrl;
+
+int
+rte_node_eth_config(struct rte_node_ethdev_config *conf, uint16_t nb_confs,
+   uint16_t nb_graphs)
+{
+   struct ethdev_tx_node_main *tx_node_data;
+   uint16_t tx_q_used, rx_q_used, port_id;
+   struct rte_node_register *tx_node;
+   char name[RTE_NODE_NAMESIZE];
+   struct rte_mempool *mp;
+   uint32_t id;
+   int i, j;
+
+   tx_node_data = ethdev_tx_node_data_get();
+   tx_node = ethdev_tx_node_get();
+   for (i = 0; i < nb_confs; i++) {
+   port_id = conf[i].port_id;
+
+   if (!rte_eth_dev_is_valid_port(port_id))
+   return -EINVAL;
+
+   /* Check for mbuf minimum private size requirement */
+   for (j = 0; j < conf[i].mp_count; j++) {
+   mp = conf[i].mp[j];
+   if (!mp)
+   continue;
+   /* Check for minimum private space */
+   if (rte_pktmbuf_priv_size(mp) < NODE_MBUF_PRIV2_SIZE) {
+   node_err("ethdev",
+"Minimum mbuf priv size requirement 
not met by mp %s",
+mp->name);
+   return -EINVAL;
+   }
+   }
+
+   rx_q_used = conf[i].num_rx_queues;
+   tx_q_used = conf[i].num_tx_queues;
+   /* Check if we have a txq for each worker */
+   if (tx_q_used < nb_graphs)
+   return -EINVAL;
+
+   /* Create node for each rx port queue pair */
+   for (j = 0; j < rx_q_used; j++) {
+   struct ethdev_rx_node_main *rx_node_data;
+   struct rte_node_register *rx_node;
+   ethdev_rx_node_elem_t *elem;
+
+   rx_node_data = ethdev_rx_get_node_data_get();
+   rx_node = ethdev_rx_node_get();
+   snprintf(name, sizeof(name), "%u-%u", port_id, j);
+   /* Clone a new rx node with same edges as parent */
+   i

[dpdk-dev] [PATCH v5 17/29] node: add ethdev Tx node

2020-04-11 Thread jerinj
From: Nithin Dabilpuram 

Add rte_node ethdev_tx process function and register it to
graph infra. This node has a specific (port, tx-queue) as context
and it enqueue's all the packets received to that specific queue pair.
When rte_eth_tx_burst() i.e enqueue to queue pair fails, packets
are forwarded to pkt_drop node to be free'd.

Signed-off-by: Nithin Dabilpuram 
Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Kiran Kumar K 
---
 lib/librte_node/Makefile |  3 +-
 lib/librte_node/ethdev_tx.c  | 86 
 lib/librte_node/ethdev_tx_priv.h | 62 +++
 lib/librte_node/meson.build  |  4 +-
 4 files changed, 152 insertions(+), 3 deletions(-)
 create mode 100644 lib/librte_node/ethdev_tx.c
 create mode 100644 lib/librte_node/ethdev_tx_priv.h

diff --git a/lib/librte_node/Makefile b/lib/librte_node/Makefile
index 314149385..7428f6c43 100644
--- a/lib/librte_node/Makefile
+++ b/lib/librte_node/Makefile
@@ -11,7 +11,7 @@ CFLAGS += -O3 -DALLOW_EXPERIMENTAL_API
 CFLAGS += $(WERROR_FLAGS)
 # Strict-aliasing rules are violated by uint8_t[] to context size casts.
 CFLAGS += -fno-strict-aliasing
-LDLIBS += -lrte_eal -lrte_graph -lrte_ethdev
+LDLIBS += -lrte_eal -lrte_graph -lrte_mbuf -lrte_ethdev
 
 EXPORT_MAP := rte_node_version.map
 
@@ -19,5 +19,6 @@ EXPORT_MAP := rte_node_version.map
 SRCS-$(CONFIG_RTE_LIBRTE_NODE) += null.c
 SRCS-$(CONFIG_RTE_LIBRTE_NODE) += log.c
 SRCS-$(CONFIG_RTE_LIBRTE_NODE) += ethdev_rx.c
+SRCS-$(CONFIG_RTE_LIBRTE_NODE) += ethdev_tx.c
 
 include $(RTE_SDK)/mk/rte.lib.mk
diff --git a/lib/librte_node/ethdev_tx.c b/lib/librte_node/ethdev_tx.c
new file mode 100644
index 0..075149089
--- /dev/null
+++ b/lib/librte_node/ethdev_tx.c
@@ -0,0 +1,86 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(C) 2020 Marvell International Ltd.
+ */
+
+#include 
+#include 
+#include 
+#include 
+#include 
+
+#include "ethdev_tx_priv.h"
+
+static struct ethdev_tx_node_main ethdev_tx_main;
+
+static uint16_t
+ethdev_tx_node_process(struct rte_graph *graph, struct rte_node *node,
+  void **objs, uint16_t nb_objs)
+{
+   ethdev_tx_node_ctx_t *ctx = (ethdev_tx_node_ctx_t *)node->ctx;
+   uint16_t port, queue;
+   uint16_t count;
+
+   /* Get Tx port id */
+   port = ctx->port;
+   queue = ctx->queue;
+
+   count = rte_eth_tx_burst(port, queue, (struct rte_mbuf **)objs,
+nb_objs);
+
+   /* Redirect unsent pkts to drop node */
+   if (count != nb_objs) {
+   rte_node_enqueue(graph, node, ETHDEV_TX_NEXT_PKT_DROP,
+&objs[count], nb_objs - count);
+   }
+
+   return count;
+}
+
+static int
+ethdev_tx_node_init(const struct rte_graph *graph, struct rte_node *node)
+{
+   ethdev_tx_node_ctx_t *ctx = (ethdev_tx_node_ctx_t *)node->ctx;
+   uint64_t port_id = RTE_MAX_ETHPORTS;
+   int i;
+
+   /* Find our port id */
+   for (i = 0; i < RTE_MAX_ETHPORTS; i++) {
+   if (ethdev_tx_main.nodes[i] == node->id) {
+   port_id = i;
+   break;
+   }
+   }
+   RTE_VERIFY(port_id < RTE_MAX_ETHPORTS);
+
+   /* Update port and queue */
+   ctx->port = port_id;
+   ctx->queue = graph->id;
+
+   return 0;
+}
+
+struct ethdev_tx_node_main *
+ethdev_tx_node_data_get(void)
+{
+   return ðdev_tx_main;
+}
+
+static struct rte_node_register ethdev_tx_node_base = {
+   .process = ethdev_tx_node_process,
+   .name = "ethdev_tx",
+
+   .init = ethdev_tx_node_init,
+
+   .nb_edges = ETHDEV_TX_NEXT_MAX,
+   .next_nodes = {
+   [ETHDEV_TX_NEXT_PKT_DROP] = "pkt_drop",
+   },
+};
+
+struct rte_node_register *
+ethdev_tx_node_get(void)
+{
+   return ðdev_tx_node_base;
+}
+
+RTE_NODE_REGISTER(ethdev_tx_node_base);
diff --git a/lib/librte_node/ethdev_tx_priv.h b/lib/librte_node/ethdev_tx_priv.h
new file mode 100644
index 0..586bff44a
--- /dev/null
+++ b/lib/librte_node/ethdev_tx_priv.h
@@ -0,0 +1,62 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(C) 2020 Marvell International Ltd.
+ */
+#ifndef __INCLUDE_ETHDEV_TX_PRIV_H__
+#define __INCLUDE_ETHDEV_TX_PRIV_H__
+
+#ifdef __cplusplus
+extern "C" {
+#endif
+
+struct ethdev_tx_node_ctx;
+typedef struct ethdev_tx_node_ctx ethdev_tx_node_ctx_t;
+
+enum ethdev_tx_next_nodes {
+   ETHDEV_TX_NEXT_PKT_DROP,
+   ETHDEV_TX_NEXT_MAX,
+};
+
+/**
+ * @internal
+ *
+ * Ethernet Tx node context structure.
+ */
+struct ethdev_tx_node_ctx {
+   uint16_t port;  /**< Port identifier of the Ethernet Tx node. */
+   uint16_t queue; /**< Queue identifier of the Ethernet Tx node. */
+};
+
+/**
+ * @internal
+ *
+ * Ethernet Tx node main structure.
+ */
+struct ethdev_tx_node_main {
+   uint32_t nodes[RTE_MAX_ETHPORTS]; /**< Tx nodes for each ethdev port. */
+};
+
+/**
+ * @internal
+ *
+ * Get the Ethernet Tx node data.
+ *
+ * @return
+ 

[dpdk-dev] [PATCH v5 20/29] node: ipv4 lookup for arm64

2020-04-11 Thread jerinj
From: Nithin Dabilpuram 

Add arm64 specific IPv4 lookup process function
for ip4_lookup node. This node performs LPM lookup
on every packet received and forwards it to a next
node that is identified by lookup result.

Signed-off-by: Nithin Dabilpuram 
Signed-off-by: Kiran Kumar K 
Signed-off-by: Pavan Nikhilesh 
---
 lib/librte_node/ip4_lookup.c  |   6 +
 lib/librte_node/ip4_lookup_neon.h | 238 ++
 2 files changed, 244 insertions(+)
 create mode 100644 lib/librte_node/ip4_lookup_neon.h

diff --git a/lib/librte_node/ip4_lookup.c b/lib/librte_node/ip4_lookup.c
index 988bc5e0c..8ec4f0626 100644
--- a/lib/librte_node/ip4_lookup.c
+++ b/lib/librte_node/ip4_lookup.c
@@ -28,6 +28,10 @@ struct ip4_lookup_node_main {
struct rte_lpm *lpm_tbl[RTE_MAX_NUMA_NODES];
 };
 
+#if defined(RTE_MACHINE_CPUFLAG_NEON)
+#include "ip4_lookup_neon.h"
+#else
+
 static uint16_t
 ip4_lookup_node_process(struct rte_graph *graph, struct rte_node *node,
void **objs, uint16_t nb_objs)
@@ -101,6 +105,8 @@ ip4_lookup_node_process(struct rte_graph *graph, struct 
rte_node *node,
return nb_objs;
 }
 
+#endif
+
 static int
 ip4_lookup_node_init(const struct rte_graph *graph, struct rte_node *node)
 {
diff --git a/lib/librte_node/ip4_lookup_neon.h 
b/lib/librte_node/ip4_lookup_neon.h
new file mode 100644
index 0..bb3150ff2
--- /dev/null
+++ b/lib/librte_node/ip4_lookup_neon.h
@@ -0,0 +1,238 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(C) 2020 Marvell International Ltd.
+ */
+
+#ifndef __INCLUDE_IP4_LOOKUP_NEON_H__
+#define __INCLUDE_IP4_LOOKUP_NEON_H__
+
+/* ARM64 NEON */
+static uint16_t
+ip4_lookup_node_process(struct rte_graph *graph, struct rte_node *node,
+   void **objs, uint16_t nb_objs)
+{
+   struct rte_mbuf *mbuf0, *mbuf1, *mbuf2, *mbuf3, **pkts;
+   struct rte_ipv4_hdr *ipv4_hdr;
+   void **to_next, **from;
+   uint16_t last_spec = 0;
+   rte_edge_t next_index;
+   uint16_t n_left_from;
+   struct rte_lpm *lpm;
+   uint16_t held = 0;
+   uint32_t drop_nh;
+   rte_xmm_t result;
+   rte_xmm_t priv01;
+   rte_xmm_t priv23;
+   int32x4_t dip;
+   int rc, i;
+
+   /* Speculative next */
+   next_index = RTE_NODE_IP4_LOOKUP_NEXT_REWRITE;
+   /* Drop node */
+   drop_nh = ((uint32_t)RTE_NODE_IP4_LOOKUP_NEXT_PKT_DROP) << 16;
+
+   /* Get socket specific LPM from ctx */
+   lpm = *((struct rte_lpm **)node->ctx);
+
+   pkts = (struct rte_mbuf **)objs;
+   from = objs;
+   n_left_from = nb_objs;
+
+#define OBJS_PER_CLINE (RTE_CACHE_LINE_SIZE / sizeof(void *))
+   for (i = OBJS_PER_CLINE; i < RTE_GRAPH_BURST_SIZE; i += OBJS_PER_CLINE)
+   rte_prefetch0(&objs[i]);
+
+   for (i = 0; i < 4 && i < n_left_from; i++)
+   rte_prefetch0(rte_pktmbuf_mtod_offset(pkts[i], void *,
+   sizeof(struct rte_ether_hdr)));
+
+   /* Get stream for the speculated next node */
+   to_next = rte_node_next_stream_get(graph, node, next_index, nb_objs);
+   while (n_left_from >= 4) {
+#if RTE_GRAPH_BURST_SIZE > 64
+   /* Prefetch next-next mbufs */
+   if (likely(n_left_from > 11)) {
+   rte_prefetch0(pkts[8]);
+   rte_prefetch0(pkts[9]);
+   rte_prefetch0(pkts[10]);
+   rte_prefetch0(pkts[11]);
+   }
+#endif
+   /* Prefetch next mbuf data */
+   if (likely(n_left_from > 7)) {
+   rte_prefetch0(rte_pktmbuf_mtod_offset(pkts[4], void *,
+   sizeof(struct rte_ether_hdr)));
+   rte_prefetch0(rte_pktmbuf_mtod_offset(pkts[5], void *,
+   sizeof(struct rte_ether_hdr)));
+   rte_prefetch0(rte_pktmbuf_mtod_offset(pkts[6], void *,
+   sizeof(struct rte_ether_hdr)));
+   rte_prefetch0(rte_pktmbuf_mtod_offset(pkts[7], void *,
+   sizeof(struct rte_ether_hdr)));
+   }
+
+   mbuf0 = pkts[0];
+   mbuf1 = pkts[1];
+   mbuf2 = pkts[2];
+   mbuf3 = pkts[3];
+
+   pkts += 4;
+   n_left_from -= 4;
+
+   /* Extract DIP of mbuf0 */
+   ipv4_hdr = rte_pktmbuf_mtod_offset(mbuf0, struct rte_ipv4_hdr *,
+   sizeof(struct rte_ether_hdr));
+   dip = vsetq_lane_s32(ipv4_hdr->dst_addr, dip, 0);
+   /* Extract cksum, ttl as ipv4 hdr is in cache */
+   priv01.u16[1] = ipv4_hdr->time_to_live;
+   priv01.u32[1] = ipv4_hdr->hdr_checksum;
+
+   /* Extract DIP of mbuf1 */
+   ipv4_hdr = rte_pktmbuf_mtod_offse

[dpdk-dev] [PATCH v5 22/29] node: add ipv4 rewrite node

2020-04-11 Thread jerinj
From: Kiran Kumar K 

Add ip4 rewrite process function for ip4_rewrite
rte_node. On every packet received by this node,
header is overwritten with new data before forwarding
it to next node. Header data to overwrite with is
identified by next hop id passed in mbuf priv data
by previous node.

Signed-off-by: Kiran Kumar K 
Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Nithin Dabilpuram 
---
 lib/librte_node/Makefile   |   1 +
 lib/librte_node/ip4_rewrite.c  | 270 +
 lib/librte_node/ip4_rewrite_priv.h |  55 ++
 lib/librte_node/meson.build|   2 +-
 4 files changed, 327 insertions(+), 1 deletion(-)
 create mode 100644 lib/librte_node/ip4_rewrite.c
 create mode 100644 lib/librte_node/ip4_rewrite_priv.h

diff --git a/lib/librte_node/Makefile b/lib/librte_node/Makefile
index ad3f2e349..ebf473c66 100644
--- a/lib/librte_node/Makefile
+++ b/lib/librte_node/Makefile
@@ -22,6 +22,7 @@ SRCS-$(CONFIG_RTE_LIBRTE_NODE) += ethdev_rx.c
 SRCS-$(CONFIG_RTE_LIBRTE_NODE) += ethdev_tx.c
 SRCS-$(CONFIG_RTE_LIBRTE_NODE) += ethdev_ctrl.c
 SRCS-$(CONFIG_RTE_LIBRTE_NODE) += ip4_lookup.c
+SRCS-$(CONFIG_RTE_LIBRTE_NODE) += ip4_rewrite.c
 
 # install header files
 SYMLINK-$(CONFIG_RTE_LIBRTE_NODE)-include += rte_node_ip4_api.h
diff --git a/lib/librte_node/ip4_rewrite.c b/lib/librte_node/ip4_rewrite.c
new file mode 100644
index 0..333e34761
--- /dev/null
+++ b/lib/librte_node/ip4_rewrite.c
@@ -0,0 +1,270 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(C) 2020 Marvell International Ltd.
+ */
+
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+
+#include "rte_node_ip4_api.h"
+
+#include "ip4_rewrite_priv.h"
+#include "node_private.h"
+
+static struct ip4_rewrite_node_main *ip4_rewrite_nm;
+
+static uint16_t
+ip4_rewrite_node_process(struct rte_graph *graph, struct rte_node *node,
+void **objs, uint16_t nb_objs)
+{
+   struct rte_mbuf *mbuf0, *mbuf1, *mbuf2, *mbuf3, **pkts;
+   struct ip4_rewrite_nh_header *nh = ip4_rewrite_nm->nh;
+   uint16_t next0, next1, next2, next3, next_index;
+   struct rte_ipv4_hdr *ip0, *ip1, *ip2, *ip3;
+   uint16_t n_left_from, held = 0, last_spec = 0;
+   void *d0, *d1, *d2, *d3;
+   void **to_next, **from;
+   rte_xmm_t priv01;
+   rte_xmm_t priv23;
+   int i;
+
+   /* Speculative next as last next */
+   next_index = *(uint16_t *)node->ctx;
+   rte_prefetch0(nh);
+
+   pkts = (struct rte_mbuf **)objs;
+   from = objs;
+   n_left_from = nb_objs;
+
+   for (i = 0; i < 4 && i < n_left_from; i++)
+   rte_prefetch0(pkts[i]);
+
+   /* Get stream for the speculated next node */
+   to_next = rte_node_next_stream_get(graph, node, next_index, nb_objs);
+   /* Update Ethernet header of pkts */
+   while (n_left_from >= 4) {
+   if (likely(n_left_from > 7)) {
+   /* Prefetch only next-mbuf struct and priv area.
+* Data need not be prefetched as we only write.
+*/
+   rte_prefetch0(pkts[4]);
+   rte_prefetch0(pkts[5]);
+   rte_prefetch0(pkts[6]);
+   rte_prefetch0(pkts[7]);
+   }
+
+   mbuf0 = pkts[0];
+   mbuf1 = pkts[1];
+   mbuf2 = pkts[2];
+   mbuf3 = pkts[3];
+
+   pkts += 4;
+   n_left_from -= 4;
+   priv01.u64[0] = node_mbuf_priv1(mbuf0)->u;
+   priv01.u64[1] = node_mbuf_priv1(mbuf1)->u;
+   priv23.u64[0] = node_mbuf_priv1(mbuf2)->u;
+   priv23.u64[1] = node_mbuf_priv1(mbuf3)->u;
+
+   /* Increment checksum by one. */
+   priv01.u32[1] += rte_cpu_to_be_16(0x0100);
+   priv01.u32[3] += rte_cpu_to_be_16(0x0100);
+   priv23.u32[1] += rte_cpu_to_be_16(0x0100);
+   priv23.u32[3] += rte_cpu_to_be_16(0x0100);
+
+   /* Update ttl,cksum rewrite ethernet hdr on mbuf0 */
+   d0 = rte_pktmbuf_mtod(mbuf0, void *);
+   rte_memcpy(d0, nh[priv01.u16[0]].rewrite_data,
+  nh[priv01.u16[0]].rewrite_len);
+
+   next0 = nh[priv01.u16[0]].tx_node;
+   ip0 = (struct rte_ipv4_hdr *)((uint8_t *)d0 +
+ sizeof(struct rte_ether_hdr));
+   ip0->time_to_live = priv01.u16[1] - 1;
+   ip0->hdr_checksum = priv01.u16[2] + priv01.u16[3];
+
+   /* Update ttl,cksum rewrite ethernet hdr on mbuf1 */
+   d1 = rte_pktmbuf_mtod(mbuf1, void *);
+   rte_memcpy(d1, nh[priv01.u16[4]].rewrite_data,
+  nh[priv01.u16[4]].rewrite_len);
+
+   next1 = nh[priv01.u16[4]].tx_node;
+   ip1 = (struct rte_ipv4_hdr *)((uint8_t *)d1 +
+

[dpdk-dev] [PATCH v5 19/29] node: add generic ipv4 lookup node

2020-04-11 Thread jerinj
From: Pavan Nikhilesh 

Add IPv4 lookup process function for ip4_lookup node.
This node performs LPM lookup using simple RTE_LPM API on every packet
received and forwards it to a next node that is identified by lookup
result.

Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Nithin Dabilpuram 
---
 doc/api/doxy-api-index.md  |   1 +
 lib/librte_node/Makefile   |   4 +-
 lib/librte_node/ip4_lookup.c   | 128 +
 lib/librte_node/meson.build|   5 +-
 lib/librte_node/rte_node_ip4_api.h |  40 +
 5 files changed, 175 insertions(+), 3 deletions(-)
 create mode 100644 lib/librte_node/ip4_lookup.c
 create mode 100644 lib/librte_node/rte_node_ip4_api.h

diff --git a/doc/api/doxy-api-index.md b/doc/api/doxy-api-index.md
index 1784674df..3908fddde 100644
--- a/doc/api/doxy-api-index.md
+++ b/doc/api/doxy-api-index.md
@@ -163,6 +163,7 @@ The public API headers are grouped by topics:
 [graph_worker] (@ref rte_graph_worker.h)
   * graph_nodes:
 [eth_node] (@ref rte_node_eth_api.h),
+[ip4_node] (@ref rte_node_ip4_api.h)
 
 - **basic**:
   [approx fraction](@ref rte_approx.h),
diff --git a/lib/librte_node/Makefile b/lib/librte_node/Makefile
index ea5fa77f7..ad3f2e349 100644
--- a/lib/librte_node/Makefile
+++ b/lib/librte_node/Makefile
@@ -11,7 +11,7 @@ CFLAGS += -O3 -DALLOW_EXPERIMENTAL_API
 CFLAGS += $(WERROR_FLAGS)
 # Strict-aliasing rules are violated by uint8_t[] to context size casts.
 CFLAGS += -fno-strict-aliasing
-LDLIBS += -lrte_eal -lrte_graph -lrte_mbuf -lrte_ethdev -lrte_mempool
+LDLIBS += -lrte_eal -lrte_graph -lrte_mbuf -lrte_lpm -lrte_ethdev -lrte_mempool
 
 EXPORT_MAP := rte_node_version.map
 
@@ -21,8 +21,10 @@ SRCS-$(CONFIG_RTE_LIBRTE_NODE) += log.c
 SRCS-$(CONFIG_RTE_LIBRTE_NODE) += ethdev_rx.c
 SRCS-$(CONFIG_RTE_LIBRTE_NODE) += ethdev_tx.c
 SRCS-$(CONFIG_RTE_LIBRTE_NODE) += ethdev_ctrl.c
+SRCS-$(CONFIG_RTE_LIBRTE_NODE) += ip4_lookup.c
 
 # install header files
+SYMLINK-$(CONFIG_RTE_LIBRTE_NODE)-include += rte_node_ip4_api.h
 SYMLINK-$(CONFIG_RTE_LIBRTE_NODE)-include += rte_node_eth_api.h
 
 include $(RTE_SDK)/mk/rte.lib.mk
diff --git a/lib/librte_node/ip4_lookup.c b/lib/librte_node/ip4_lookup.c
new file mode 100644
index 0..988bc5e0c
--- /dev/null
+++ b/lib/librte_node/ip4_lookup.c
@@ -0,0 +1,128 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(C) 2020 Marvell International Ltd.
+ */
+
+#include 
+#include 
+
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+
+#include "rte_node_ip4_api.h"
+
+#include "node_private.h"
+
+#define IPV4_L3FWD_LPM_MAX_RULES 1024
+#define IPV4_L3FWD_LPM_NUMBER_TBL8S (1 << 8)
+
+/* IP4 Lookup global data struct */
+struct ip4_lookup_node_main {
+   struct rte_lpm *lpm_tbl[RTE_MAX_NUMA_NODES];
+};
+
+static uint16_t
+ip4_lookup_node_process(struct rte_graph *graph, struct rte_node *node,
+   void **objs, uint16_t nb_objs)
+{
+   struct rte_ipv4_hdr *ipv4_hdr;
+   void **to_next, **from;
+   uint16_t last_spec = 0;
+   struct rte_mbuf *mbuf;
+   rte_edge_t next_index;
+   struct rte_lpm *lpm;
+   uint16_t held = 0;
+   uint32_t drop_nh;
+   int i, rc;
+
+   /* Speculative next */
+   next_index = RTE_NODE_IP4_LOOKUP_NEXT_REWRITE;
+   /* Drop node */
+   drop_nh = ((uint32_t)RTE_NODE_IP4_LOOKUP_NEXT_PKT_DROP) << 16;
+
+   /* Get socket specific LPM from ctx */
+   lpm = *((struct rte_lpm **)node->ctx);
+   from = objs;
+
+   /* Get stream for the speculated next node */
+   to_next = rte_node_next_stream_get(graph, node, next_index, nb_objs);
+   for (i = 0; i < nb_objs; i++) {
+   uint32_t next_hop;
+   uint16_t next;
+
+   mbuf = (struct rte_mbuf *)objs[i];
+
+   /* Extract DIP of mbuf0 */
+   ipv4_hdr = rte_pktmbuf_mtod_offset(mbuf, struct rte_ipv4_hdr *,
+   sizeof(struct rte_ether_hdr));
+   /* Extract cksum, ttl as ipv4 hdr is in cache */
+   node_mbuf_priv1(mbuf)->cksum = ipv4_hdr->hdr_checksum;
+   node_mbuf_priv1(mbuf)->ttl = ipv4_hdr->time_to_live;
+
+   rc = rte_lpm_lookup(lpm, rte_be_to_cpu_32(ipv4_hdr->dst_addr),
+   &next_hop);
+   next_hop = (rc == 0) ? next_hop : drop_nh;
+
+   node_mbuf_priv1(mbuf)->nh = (uint16_t)next_hop;
+   next_hop = next_hop >> 16;
+   next = (uint16_t)next_hop;
+
+   if (unlikely(next_index != next)) {
+   /* Copy things successfully speculated till now */
+   rte_memcpy(to_next, from, last_spec * sizeof(from[0]));
+   from += last_spec;
+   to_next += last_spec;
+   held += last_spec;
+   last_spec = 0;
+
+

[dpdk-dev] [PATCH v5 21/29] node: ipv4 lookup for x86

2020-04-11 Thread jerinj
From: Pavan Nikhilesh 

Add IPv4 lookup process function for ip4_lookup
rte_node. This node performs LPM lookup using x86_64
vector supported RTE_LPM API on every packet received
and forwards it to a next node that is identified by
lookup result.

Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Nithin Dabilpuram 
Signed-off-by: Kiran Kumar K 
---
 lib/librte_node/ip4_lookup.c |   2 +
 lib/librte_node/ip4_lookup_sse.h | 244 +++
 2 files changed, 246 insertions(+)
 create mode 100644 lib/librte_node/ip4_lookup_sse.h

diff --git a/lib/librte_node/ip4_lookup.c b/lib/librte_node/ip4_lookup.c
index 8ec4f0626..39c8d8db0 100644
--- a/lib/librte_node/ip4_lookup.c
+++ b/lib/librte_node/ip4_lookup.c
@@ -30,6 +30,8 @@ struct ip4_lookup_node_main {
 
 #if defined(RTE_MACHINE_CPUFLAG_NEON)
 #include "ip4_lookup_neon.h"
+#elif defined(RTE_ARCH_X86)
+#include "ip4_lookup_sse.h"
 #else
 
 static uint16_t
diff --git a/lib/librte_node/ip4_lookup_sse.h b/lib/librte_node/ip4_lookup_sse.h
new file mode 100644
index 0..a071cc591
--- /dev/null
+++ b/lib/librte_node/ip4_lookup_sse.h
@@ -0,0 +1,244 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(C) 2020 Marvell International Ltd.
+ */
+
+#ifndef __INCLUDE_IP4_LOOKUP_SSE_H__
+#define __INCLUDE_IP4_LOOKUP_SSE_H__
+
+/* X86 SSE */
+static uint16_t
+ip4_lookup_node_process(struct rte_graph *graph, struct rte_node *node,
+   void **objs, uint16_t nb_objs)
+{
+   struct rte_mbuf *mbuf0, *mbuf1, *mbuf2, *mbuf3, **pkts;
+   rte_edge_t next0, next1, next2, next3, next_index;
+   struct rte_ipv4_hdr *ipv4_hdr;
+   uint32_t ip0, ip1, ip2, ip3;
+   void **to_next, **from;
+   uint16_t last_spec = 0;
+   uint16_t n_left_from;
+   struct rte_lpm *lpm;
+   uint16_t held = 0;
+   uint32_t drop_nh;
+   rte_xmm_t dst;
+   __m128i dip; /* SSE register */
+   int rc, i;
+
+   /* Speculative next */
+   next_index = RTE_NODE_IP4_LOOKUP_NEXT_REWRITE;
+   /* Drop node */
+   drop_nh = ((uint32_t)RTE_NODE_IP4_LOOKUP_NEXT_PKT_DROP) << 16;
+
+   /* Get socket specific LPM from ctx */
+   lpm = *((struct rte_lpm **)node->ctx);
+
+   pkts = (struct rte_mbuf **)objs;
+   from = objs;
+   n_left_from = nb_objs;
+
+   if (n_left_from >= 4) {
+   for (i = 0; i < 4; i++)
+   rte_prefetch0(rte_pktmbuf_mtod_offset(pkts[i], void *,
+   sizeof(struct rte_ether_hdr)));
+   }
+
+   /* Get stream for the speculated next node */
+   to_next = rte_node_next_stream_get(graph, node, next_index, nb_objs);
+   while (n_left_from >= 4) {
+   /* Prefetch next-next mbufs */
+   if (likely(n_left_from > 11)) {
+   rte_prefetch0(pkts[8]);
+   rte_prefetch0(pkts[9]);
+   rte_prefetch0(pkts[10]);
+   rte_prefetch0(pkts[11]);
+   }
+
+   /* Prefetch next mbuf data */
+   if (likely(n_left_from > 7)) {
+   rte_prefetch0(rte_pktmbuf_mtod_offset(pkts[4], void *,
+   sizeof(struct rte_ether_hdr)));
+   rte_prefetch0(rte_pktmbuf_mtod_offset(pkts[5], void *,
+   sizeof(struct rte_ether_hdr)));
+   rte_prefetch0(rte_pktmbuf_mtod_offset(pkts[6], void *,
+   sizeof(struct rte_ether_hdr)));
+   rte_prefetch0(rte_pktmbuf_mtod_offset(pkts[7], void *,
+   sizeof(struct rte_ether_hdr)));
+   }
+
+   mbuf0 = pkts[0];
+   mbuf1 = pkts[1];
+   mbuf2 = pkts[2];
+   mbuf3 = pkts[3];
+
+   pkts += 4;
+   n_left_from -= 4;
+
+   /* Extract DIP of mbuf0 */
+   ipv4_hdr = rte_pktmbuf_mtod_offset(mbuf0, struct rte_ipv4_hdr *,
+   sizeof(struct rte_ether_hdr));
+   ip0 = ipv4_hdr->dst_addr;
+   /* Extract cksum, ttl as ipv4 hdr is in cache */
+   node_mbuf_priv1(mbuf0)->cksum = ipv4_hdr->hdr_checksum;
+   node_mbuf_priv1(mbuf0)->ttl = ipv4_hdr->time_to_live;
+
+   /* Extract DIP of mbuf1 */
+   ipv4_hdr = rte_pktmbuf_mtod_offset(mbuf1, struct rte_ipv4_hdr *,
+   sizeof(struct rte_ether_hdr));
+   ip1 = ipv4_hdr->dst_addr;
+   /* Extract cksum, ttl as ipv4 hdr is in cache */
+   node_mbuf_priv1(mbuf1)->cksum = ipv4_hdr->hdr_checksum;
+   node_mbuf_priv1(mbuf1)->ttl = ipv4_hdr->time_to_live;
+
+   /* Extract DIP of mbuf2 */
+   ipv4_hdr = rte_pktmbuf_mtod_offset(mbuf2, struct rte_ipv4_hdr *

[dpdk-dev] [PATCH v5 24/29] node: add packet drop node

2020-04-11 Thread jerinj
From: Nithin Dabilpuram 

Add packet drop node process function for pkt_drop
rte_node. This node simply free's every object received as
an rte_mbuf to its rte_pktmbuf pool.

Signed-off-by: Nithin Dabilpuram 
Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Kiran Kumar K 
---
 lib/librte_node/Makefile|  1 +
 lib/librte_node/meson.build |  2 +-
 lib/librte_node/pkt_drop.c  | 26 ++
 3 files changed, 28 insertions(+), 1 deletion(-)
 create mode 100644 lib/librte_node/pkt_drop.c

diff --git a/lib/librte_node/Makefile b/lib/librte_node/Makefile
index ebf473c66..322b651c8 100644
--- a/lib/librte_node/Makefile
+++ b/lib/librte_node/Makefile
@@ -23,6 +23,7 @@ SRCS-$(CONFIG_RTE_LIBRTE_NODE) += ethdev_tx.c
 SRCS-$(CONFIG_RTE_LIBRTE_NODE) += ethdev_ctrl.c
 SRCS-$(CONFIG_RTE_LIBRTE_NODE) += ip4_lookup.c
 SRCS-$(CONFIG_RTE_LIBRTE_NODE) += ip4_rewrite.c
+SRCS-$(CONFIG_RTE_LIBRTE_NODE) += pkt_drop.c
 
 # install header files
 SYMLINK-$(CONFIG_RTE_LIBRTE_NODE)-include += rte_node_ip4_api.h
diff --git a/lib/librte_node/meson.build b/lib/librte_node/meson.build
index ed78791dd..8aa93654b 100644
--- a/lib/librte_node/meson.build
+++ b/lib/librte_node/meson.build
@@ -2,7 +2,7 @@
 # Copyright(C) 2020 Marvell International Ltd.
 
 sources = files('null.c', 'log.c', 'ethdev_rx.c', 'ethdev_tx.c', 
'ip4_lookup.c',
-   'ip4_rewrite.c', 'ethdev_ctrl.c')
+   'ip4_rewrite.c', 'pkt_drop.c', 'ethdev_ctrl.c')
 headers = files('rte_node_ip4_api.h', 'rte_node_eth_api.h')
 allow_experimental_apis = true
 # Strict-aliasing rules are violated by uint8_t[] to context size casts.
diff --git a/lib/librte_node/pkt_drop.c b/lib/librte_node/pkt_drop.c
new file mode 100644
index 0..c35001323
--- /dev/null
+++ b/lib/librte_node/pkt_drop.c
@@ -0,0 +1,26 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(C) 2020 Marvell International Ltd.
+ */
+
+#include 
+#include 
+#include 
+
+static uint16_t
+pkt_drop_process(struct rte_graph *graph, struct rte_node *node, void **objs,
+uint16_t nb_objs)
+{
+   RTE_SET_USED(node);
+   RTE_SET_USED(graph);
+
+   rte_pktmbuf_free_bulk((struct rte_mbuf **)objs, nb_objs);
+
+   return nb_objs;
+}
+
+static struct rte_node_register pkt_drop_node = {
+   .process = pkt_drop_process,
+   .name = "pkt_drop",
+};
+
+RTE_NODE_REGISTER(pkt_drop_node);
-- 
2.25.1



[dpdk-dev] [PATCH v5 23/29] node: add ipv4 rewrite and lookup ctrl API

2020-04-11 Thread jerinj
From: Nithin Dabilpuram 

Add ip4_rewrite and ip4_lookup ctrl API. ip4_lookup ctrl
API is used to add route entries for LPM lookup with
result data containing next hop id and next proto.
ip4_rewrite ctrl API is used to add rewrite data for
every next hop.

Signed-off-by: Nithin Dabilpuram 
Signed-off-by: Pavan Nikhilesh 
Signed-off-by: Kiran Kumar K 
---
 lib/librte_node/ethdev_ctrl.c| 18 ++-
 lib/librte_node/ip4_lookup.c | 79 
 lib/librte_node/ip4_rewrite.c| 56 
 lib/librte_node/ip4_rewrite_priv.h   | 22 
 lib/librte_node/rte_node_ip4_api.h   | 38 +
 lib/librte_node/rte_node_version.map |  2 +
 6 files changed, 214 insertions(+), 1 deletion(-)

diff --git a/lib/librte_node/ethdev_ctrl.c b/lib/librte_node/ethdev_ctrl.c
index 599d20b0b..13b8b705f 100644
--- a/lib/librte_node/ethdev_ctrl.c
+++ b/lib/librte_node/ethdev_ctrl.c
@@ -11,6 +11,7 @@
 
 #include "ethdev_rx_priv.h"
 #include "ethdev_tx_priv.h"
+#include "ip4_rewrite_priv.h"
 #include "node_private.h"
 
 static struct ethdev_ctrl {
@@ -21,14 +22,17 @@ int
 rte_node_eth_config(struct rte_node_ethdev_config *conf, uint16_t nb_confs,
uint16_t nb_graphs)
 {
+   struct rte_node_register *ip4_rewrite_node;
struct ethdev_tx_node_main *tx_node_data;
uint16_t tx_q_used, rx_q_used, port_id;
struct rte_node_register *tx_node;
char name[RTE_NODE_NAMESIZE];
+   const char *next_nodes = name;
struct rte_mempool *mp;
+   int i, j, rc;
uint32_t id;
-   int i, j;
 
+   ip4_rewrite_node = ip4_rewrite_node_get();
tx_node_data = ethdev_tx_node_data_get();
tx_node = ethdev_tx_node_get();
for (i = 0; i < nb_confs; i++) {
@@ -92,6 +96,18 @@ rte_node_eth_config(struct rte_node_ethdev_config *conf, 
uint16_t nb_confs,
 
node_dbg("ethdev", "Tx node %s-%s: is at %u", tx_node->name,
 name, id);
+
+   /* Prepare the actual name of the cloned node */
+   snprintf(name, sizeof(name), "ethdev_tx-%u", port_id);
+
+   /* Add this tx port node as next to ip4_rewrite_node */
+   rte_node_edge_update(ip4_rewrite_node->id, RTE_EDGE_ID_INVALID,
+&next_nodes, 1);
+   /* Assuming edge id is the last one alloc'ed */
+   rc = ip4_rewrite_set_next(
+   port_id, rte_node_edge_count(ip4_rewrite_node->id) - 1);
+   if (rc < 0)
+   return rc;
}
 
ctrl.nb_graphs = nb_graphs;
diff --git a/lib/librte_node/ip4_lookup.c b/lib/librte_node/ip4_lookup.c
index 39c8d8db0..8e6379457 100644
--- a/lib/librte_node/ip4_lookup.c
+++ b/lib/librte_node/ip4_lookup.c
@@ -28,6 +28,8 @@ struct ip4_lookup_node_main {
struct rte_lpm *lpm_tbl[RTE_MAX_NUMA_NODES];
 };
 
+static struct ip4_lookup_node_main ip4_lookup_nm;
+
 #if defined(RTE_MACHINE_CPUFLAG_NEON)
 #include "ip4_lookup_neon.h"
 #elif defined(RTE_ARCH_X86)
@@ -109,12 +111,89 @@ ip4_lookup_node_process(struct rte_graph *graph, struct 
rte_node *node,
 
 #endif
 
+int
+rte_node_ip4_route_add(uint32_t ip, uint8_t depth, uint16_t next_hop,
+  enum rte_node_ip4_lookup_next next_node)
+{
+   char abuf[INET6_ADDRSTRLEN];
+   struct in_addr in;
+   uint8_t socket;
+   uint32_t val;
+   int ret;
+
+   in.s_addr = htonl(ip);
+   inet_ntop(AF_INET, &in, abuf, sizeof(abuf));
+   /* Embedded next node id into 24 bit next hop */
+   val = ((next_node << 16) | next_hop) & ((1ull << 24) - 1);
+   node_dbg("ip4_lookup", "LPM: Adding route %s / %d nh (0x%x)", abuf,
+depth, val);
+
+   for (socket = 0; socket < RTE_MAX_NUMA_NODES; socket++) {
+   if (!ip4_lookup_nm.lpm_tbl[socket])
+   continue;
+
+   ret = rte_lpm_add(ip4_lookup_nm.lpm_tbl[socket],
+ ip, depth, val);
+   if (ret < 0) {
+   node_err("ip4_lookup",
+"Unable to add entry %s / %d nh (%x) to LPM 
table on sock %d, rc=%d\n",
+abuf, depth, val, socket, ret);
+   return ret;
+   }
+   }
+
+   return 0;
+}
+
+static int
+setup_lpm(struct ip4_lookup_node_main *nm, int socket)
+{
+   struct rte_lpm_config config_ipv4;
+   char s[RTE_LPM_NAMESIZE];
+
+   /* One LPM table per socket */
+   if (nm->lpm_tbl[socket])
+   return 0;
+
+   /* create the LPM table */
+   config_ipv4.max_rules = IPV4_L3FWD_LPM_MAX_RULES;
+   config_ipv4.number_tbl8s = IPV4_L3FWD_LPM_NUMBER_TBL8S;
+   config_ipv4.flags = 0;
+   snprintf(s, sizeof(s), "IPV4_L3FWD_LPM_%d", socket);
+   nm->lpm_tbl[socket] = rte_lpm_create(s, socket, &config_ipv4);
+   if (nm->lpm_tbl[socket] == NULL)
+

[dpdk-dev] [PATCH v5 29/29] doc: add l3fwd graph application user guide

2020-04-11 Thread jerinj
From: Nithin Dabilpuram 

Adding the user guide for l3fwd graph application.

Signed-off-by: Nithin Dabilpuram 
---
 MAINTAINERS   |   1 +
 doc/guides/rel_notes/release_20_05.rst|   8 +
 doc/guides/sample_app_ug/index.rst|   1 +
 doc/guides/sample_app_ug/intro.rst|   4 +
 doc/guides/sample_app_ug/l3_forward_graph.rst | 334 ++
 5 files changed, 348 insertions(+)
 create mode 100644 doc/guides/sample_app_ug/l3_forward_graph.rst

diff --git a/MAINTAINERS b/MAINTAINERS
index de57f452b..870cd8cae 100644
--- a/MAINTAINERS
+++ b/MAINTAINERS
@@ -1576,6 +1576,7 @@ F: doc/guides/sample_app_ug/l3_forward.rst
 
 M: Nithin Dabilpuram 
 F: examples/l3fwd-graph/
+F: doc/guides/sample_app_ug/l3_forward_graph.rst
 
 F: examples/link_status_interrupt/
 F: doc/guides/sample_app_ug/link_status_intr.rst
diff --git a/doc/guides/rel_notes/release_20_05.rst 
b/doc/guides/rel_notes/release_20_05.rst
index d208547ec..9d3e7bd69 100644
--- a/doc/guides/rel_notes/release_20_05.rst
+++ b/doc/guides/rel_notes/release_20_05.rst
@@ -86,6 +86,14 @@ New Features
 that can be configured through ``rte_node_ip4_rewrite_add`` function.
   * Packet drop node: Frees the packets received to their respective mempool.
 
+* **Added new l3fwd-graph sample application.**
+
+  Added an example application ``l3fwd-graph``. It demonstrates the usage of 
graph
+  library and node library for packet processing. In addition to the library 
usage
+  demonstration, this application can use for performance comparison with 
existing
+  ``l3fwd`` (The static code without any nodes) with the modular 
``l3fwd-graph``
+  approach.
+
 
 Removed Items
 -
diff --git a/doc/guides/sample_app_ug/index.rst 
b/doc/guides/sample_app_ug/index.rst
index ac3445147..cf9c1e44d 100644
--- a/doc/guides/sample_app_ug/index.rst
+++ b/doc/guides/sample_app_ug/index.rst
@@ -29,6 +29,7 @@ Sample Applications User Guides
 l2_forward_event
 l2_forward_cat
 l3_forward
+l3_forward_graph
 l3_forward_power_man
 l3_forward_access_ctrl
 link_status_intr
diff --git a/doc/guides/sample_app_ug/intro.rst 
b/doc/guides/sample_app_ug/intro.rst
index 6cd0342a1..8ff223b16 100644
--- a/doc/guides/sample_app_ug/intro.rst
+++ b/doc/guides/sample_app_ug/intro.rst
@@ -54,6 +54,10 @@ examples are highlighted below.
   forwarding, or ``l3fwd`` application does forwarding based on Internet
   Protocol, IPv4 or IPv6 like a simple router.
 
+* :doc:`Network Layer 3 forwarding Graph`: The Network Layer3
+  forwarding Graph, or ``l3fwd_graph`` application does forwarding based on 
IPv4
+  like a simple router with DPDK Graph framework.
+
 * :doc:`Hardware packet copying`: The Hardware packet copying,
   or ``ioatfwd`` application demonstrates how to use IOAT rawdev driver for
   copying packets between two threads.
diff --git a/doc/guides/sample_app_ug/l3_forward_graph.rst 
b/doc/guides/sample_app_ug/l3_forward_graph.rst
new file mode 100644
index 0..df50827ba
--- /dev/null
+++ b/doc/guides/sample_app_ug/l3_forward_graph.rst
@@ -0,0 +1,334 @@
+..  SPDX-License-Identifier: BSD-3-Clause
+Copyright(C) 2020 Marvell International Ltd.
+
+L3 Forwarding Graph Sample Application
+==
+
+The L3 Forwarding Graph application is a simple example of packet processing
+using the DPDK Graph framework. The application performs L3 forwarding using
+Graph framework and nodes written for graph framework.
+
+Overview
+
+
+The application demonstrates the use of the graph framework and graph nodes
+``ethdev_rx``, ``ip4_lookup``, ``ip4_rewrite``, ``ethdev_tx`` and ``pkt_drop`` 
in DPDK to
+implement packet forwarding.
+
+The initialization is very similar to those of the :doc:`l3_forward`.
+There is also additional initialization of graph for graph object creation
+and configuration per lcore.
+Run-time path is main thing that differs from L3 forwarding sample application.
+Difference is that forwarding logic starting from Rx, followed by LPM lookup,
+TTL update and finally Tx is implemented inside graph nodes. These nodes are
+interconnected in graph framework. Application main loop needs to walk over
+graph using ``rte_graph_walk()`` with graph objects created one per slave 
lcore.
+
+The lookup method is as per implementation of ``ip4_lookup`` graph node.
+The ID of the output interface for the input packet is the next hop returned by
+the LPM lookup. The set of LPM rules used by the application is statically
+configured and provided to ``ip4_lookup`` graph node and ``ip4_rewrite`` graph 
node
+using node control API ``rte_node_ip4_route_add()`` and 
``rte_node_ip4_rewrite_add()``.
+
+In the sample application, only IPv4 forwarding is supported as of now.
+
+Compiling the Application
+-
+
+To compile the sample application see :doc:`compiling`.
+
+The application is located in the ``l3fwd-graph`` sub-directory.
+
+Running the Applica

[dpdk-dev] [PATCH v5 27/29] l3fwd-graph: add graph config and main loop

2020-04-11 Thread jerinj
From: Nithin Dabilpuram 

Add graph creation, configuration logic and graph main loop.
This graph main loop is run on every slave lcore and calls
rte_graph_walk() to walk over lcore specific rte_graph.
Master core accumulates and prints graph walk stats of all the
lcore's graph's.

Signed-off-by: Nithin Dabilpuram 
---
 examples/l3fwd-graph/main.c | 248 +++-
 1 file changed, 246 insertions(+), 2 deletions(-)

diff --git a/examples/l3fwd-graph/main.c b/examples/l3fwd-graph/main.c
index 7ea788589..40108a0d3 100644
--- a/examples/l3fwd-graph/main.c
+++ b/examples/l3fwd-graph/main.c
@@ -23,9 +23,13 @@
 #include 
 #include 
 #include 
+#include 
+#include 
 #include 
 #include 
 #include 
+#include 
+#include 
 #include 
 #include 
 #include 
@@ -75,12 +79,17 @@ static uint32_t enabled_port_mask;
 struct lcore_rx_queue {
uint16_t port_id;
uint8_t queue_id;
+   char node_name[RTE_NODE_NAMESIZE];
 };
 
 /* Lcore conf */
 struct lcore_conf {
uint16_t n_rx_queue;
struct lcore_rx_queue rx_queue_list[MAX_RX_QUEUE_PER_LCORE];
+
+   struct rte_graph *graph;
+   char name[RTE_GRAPH_NAMESIZE];
+   rte_graph_t graph_id;
 } __rte_cache_aligned;
 
 static struct lcore_conf lcore_conf[RTE_MAX_LCORE];
@@ -119,6 +128,25 @@ static struct rte_eth_conf port_conf = {
 
 static struct rte_mempool *pktmbuf_pool[RTE_MAX_ETHPORTS][NB_SOCKETS];
 
+static struct rte_node_ethdev_config ethdev_conf[RTE_MAX_ETHPORTS];
+
+struct ipv4_l3fwd_lpm_route {
+   uint32_t ip;
+   uint8_t depth;
+   uint8_t if_out;
+};
+
+#define IPV4_L3FWD_LPM_NUM_ROUTES  
\
+   (sizeof(ipv4_l3fwd_lpm_route_array) /  \
+sizeof(ipv4_l3fwd_lpm_route_array[0]))
+/* 198.18.0.0/16 are set aside for RFC2544 benchmarking. */
+static struct ipv4_l3fwd_lpm_route ipv4_l3fwd_lpm_route_array[] = {
+   {RTE_IPV4(198, 18, 0, 0), 24, 0}, {RTE_IPV4(198, 18, 1, 0), 24, 1},
+   {RTE_IPV4(198, 18, 2, 0), 24, 2}, {RTE_IPV4(198, 18, 3, 0), 24, 3},
+   {RTE_IPV4(198, 18, 4, 0), 24, 4}, {RTE_IPV4(198, 18, 5, 0), 24, 5},
+   {RTE_IPV4(198, 18, 6, 0), 24, 6}, {RTE_IPV4(198, 18, 7, 0), 24, 7},
+};
+
 static int
 check_lcore_params(void)
 {
@@ -633,17 +661,89 @@ signal_handler(int signum)
}
 }
 
+static void
+print_stats(void)
+{
+   const char topLeft[] = {27, '[', '1', ';', '1', 'H', '\0'};
+   const char clr[] = {27, '[', '2', 'J', '\0'};
+   struct rte_graph_cluster_stats_param s_param;
+   struct rte_graph_cluster_stats *stats;
+   const char *pattern = "worker_*";
+
+   /* Prepare stats object */
+   memset(&s_param, 0, sizeof(s_param));
+   s_param.f = stdout;
+   s_param.socket_id = SOCKET_ID_ANY;
+   s_param.graph_patterns = &pattern;
+   s_param.nb_graph_patterns = 1;
+
+   stats = rte_graph_cluster_stats_create(&s_param);
+   if (stats == NULL)
+   rte_exit(EXIT_FAILURE, "Unable to create stats object\n");
+
+   while (!force_quit) {
+   /* Clear screen and move to top left */
+   printf("%s%s", clr, topLeft);
+   rte_graph_cluster_stats_get(stats, 0);
+   rte_delay_ms(1E3);
+   }
+
+   rte_graph_cluster_stats_destroy(stats);
+}
+
+/* Main processing loop */
+static int
+graph_main_loop(void *conf)
+{
+   struct lcore_conf *qconf;
+   struct rte_graph *graph;
+   uint32_t lcore_id;
+
+   RTE_SET_USED(conf);
+
+   lcore_id = rte_lcore_id();
+   qconf = &lcore_conf[lcore_id];
+   graph = qconf->graph;
+
+   if (!graph) {
+   RTE_LOG(INFO, L3FWD_GRAPH, "Lcore %u has nothing to do\n",
+   lcore_id);
+   return 0;
+   }
+
+   RTE_LOG(INFO, L3FWD_GRAPH,
+   "Entering main loop on lcore %u, graph %s(%p)\n", lcore_id,
+   qconf->name, graph);
+
+   while (likely(!force_quit))
+   rte_graph_walk(graph);
+
+   return 0;
+}
+
 int
 main(int argc, char **argv)
 {
+   /* Rewrite data of src and dst ether addr */
+   uint8_t rewrite_data[2 * sizeof(struct rte_ether_addr)];
+   static const char * const default_patterns[] = {
+   "ip4*",
+   "ethdev_tx-*",
+   "pkt_drop",
+   };
uint8_t nb_rx_queue, queue, socketid;
+   struct rte_graph_param graph_conf;
struct rte_eth_dev_info dev_info;
+   uint32_t nb_ports, nb_conf = 0;
uint32_t n_tx_queue, nb_lcores;
struct rte_eth_txconf *txconf;
-   uint16_t queueid, portid;
+   uint16_t queueid, portid, i;
+   const char **node_patterns;
struct lcore_conf *qconf;
+   uint16_t nb_graphs = 0;
+   uint16_t nb_patterns;
+   uint8_t rewrite_len;
uint32_t lcore_id;
-   uint32_t nb_ports;
int ret;
 
/* Init EAL */
@@ -792,6 +892,18 @@ main(int argc, char **argv)
   

[dpdk-dev] [PATCH v5 25/29] l3fwd-graph: add graph based l3fwd skeleton

2020-04-11 Thread jerinj
From: Nithin Dabilpuram 

Add graph based l3fwd application skeleton with cmdline
parsing support inline with normal l3fwd.

Signed-off-by: Nithin Dabilpuram 
---
 MAINTAINERS  |   3 +
 examples/Makefile|   3 +
 examples/l3fwd-graph/Makefile|  58 
 examples/l3fwd-graph/main.c  | 534 +++
 examples/l3fwd-graph/meson.build |  13 +
 examples/meson.build |   6 +-
 6 files changed, 615 insertions(+), 2 deletions(-)
 create mode 100644 examples/l3fwd-graph/Makefile
 create mode 100644 examples/l3fwd-graph/main.c
 create mode 100644 examples/l3fwd-graph/meson.build

diff --git a/MAINTAINERS b/MAINTAINERS
index 55fb9bbb0..de57f452b 100644
--- a/MAINTAINERS
+++ b/MAINTAINERS
@@ -1574,6 +1574,9 @@ F: doc/guides/sample_app_ug/l2_forward_event.rst
 F: examples/l3fwd/
 F: doc/guides/sample_app_ug/l3_forward.rst
 
+M: Nithin Dabilpuram 
+F: examples/l3fwd-graph/
+
 F: examples/link_status_interrupt/
 F: doc/guides/sample_app_ug/link_status_intr.rst
 
diff --git a/examples/Makefile b/examples/Makefile
index feff79784..b7e99a2f7 100644
--- a/examples/Makefile
+++ b/examples/Makefile
@@ -51,6 +51,9 @@ DIRS-$(CONFIG_RTE_LIBRTE_ACL) += l3fwd-acl
 ifeq ($(CONFIG_RTE_LIBRTE_LPM)$(CONFIG_RTE_LIBRTE_HASH),yy)
 DIRS-$(CONFIG_RTE_LIBRTE_POWER) += l3fwd-power
 endif
+ifeq ($(CONFIG_RTE_LIBRTE_GRAPH),y)
+DIRS-y += l3fwd-graph
+endif
 DIRS-y += link_status_interrupt
 DIRS-y += multi_process
 DIRS-y += ntb
diff --git a/examples/l3fwd-graph/Makefile b/examples/l3fwd-graph/Makefile
new file mode 100644
index 0..f3cf275ec
--- /dev/null
+++ b/examples/l3fwd-graph/Makefile
@@ -0,0 +1,58 @@
+# SPDX-License-Identifier: BSD-3-Clause
+# Copyright(C) 2020 Marvell International Ltd.
+
+# binary name
+APP = l3fwd-graph
+
+# all source are stored in SRCS-y
+SRCS-y := main.c
+
+# Build using pkg-config variables if possible
+ifeq ($(shell pkg-config --exists libdpdk && echo 0),0)
+
+all: shared
+.PHONY: shared static
+shared: build/$(APP)-shared
+   ln -sf $(APP)-shared build/$(APP)
+static: build/$(APP)-static
+   ln -sf $(APP)-static build/$(APP)
+
+PKGCONF=pkg-config --define-prefix
+
+PC_FILE := $(shell $(PKGCONF) --path libdpdk)
+CFLAGS += -O3 $(shell $(PKGCONF) --cflags libdpdk) -DALLOW_EXPERIMENTAL_API
+LDFLAGS_SHARED = $(shell $(PKGCONF) --libs libdpdk)
+LDFLAGS_STATIC = -Wl,-Bstatic $(shell $(PKGCONF) --static --libs libdpdk)
+
+build/$(APP)-shared: $(SRCS-y) Makefile $(PC_FILE) | build
+   $(CC) $(CFLAGS) $(SRCS-y) -o $@ $(LDFLAGS) $(LDFLAGS_SHARED)
+
+build/$(APP)-static: $(SRCS-y) Makefile $(PC_FILE) | build
+   $(CC) $(CFLAGS) $(SRCS-y) -o $@ $(LDFLAGS) $(LDFLAGS_STATIC)
+
+build:
+   @mkdir -p $@
+
+.PHONY: clean
+clean:
+   rm -f build/$(APP) build/$(APP)-static build/$(APP)-shared
+   test -d build && rmdir -p build || true
+
+else # Build using legacy build system
+
+ifeq ($(RTE_SDK),)
+$(error "Please define RTE_SDK environment variable")
+endif
+
+# Default target, detect a build directory, by looking for a path with a 
.config
+RTE_TARGET ?= $(notdir $(abspath $(dir $(firstword $(wildcard 
$(RTE_SDK)/*/.config)
+
+include $(RTE_SDK)/mk/rte.vars.mk
+
+CFLAGS += -DALLOW_EXPERIMENTAL_API
+CFLAGS += -I$(SRCDIR)
+CFLAGS += -O3 $(USER_FLAGS)
+CFLAGS += $(WERROR_FLAGS)
+
+include $(RTE_SDK)/mk/rte.extapp.mk
+endif
diff --git a/examples/l3fwd-graph/main.c b/examples/l3fwd-graph/main.c
new file mode 100644
index 0..ab6713488
--- /dev/null
+++ b/examples/l3fwd-graph/main.c
@@ -0,0 +1,534 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(C) 2020 Marvell International Ltd.
+ */
+
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+
+#include 
+#include 
+
+/* Log type */
+#define RTE_LOGTYPE_L3FWD_GRAPH RTE_LOGTYPE_USER1
+
+/*
+ * Configurable number of RX/TX ring descriptors
+ */
+#define RTE_TEST_RX_DESC_DEFAULT 1024
+#define RTE_TEST_TX_DESC_DEFAULT 1024
+
+#define MAX_TX_QUEUE_PER_PORT RTE_MAX_ETHPORTS
+#define MAX_RX_QUEUE_PER_PORT 128
+
+#define MAX_RX_QUEUE_PER_LCORE 16
+
+#define MAX_LCORE_PARAMS 1024
+
+#define NB_SOCKETS 8
+
+/**< Ports set in promiscuous mode off by default. */
+static int promiscuous_on;
+
+static int numa_on = 1;  /**< NUMA is enabled by default. */
+static int per_port_pool; /**< Use separate buffer pools per port; disabled */
+ /**< by default */
+
+static volatile bool force_quit;
+
+/* Ethernet addresses of ports */
+static uint64_t dest_eth_addr[RTE_MAX_ETHPORTS];
+xmm_t val_eth[RTE_MAX_ETHPORTS];
+
+/* Mask of enabled ports */
+static uint32_t enabled_port_mask;
+
+struct lcore_rx_queue {
+   uint16_t port_id;
+   uint8_t queue_id;
+};
+
+/* Lcore conf */
+struct lcore_conf {
+   uint16_t n_rx_queue;
+   s

[dpdk-dev] [PATCH v5 26/29] l3fwd-graph: add ethdev configuration changes

2020-04-11 Thread jerinj
From: Nithin Dabilpuram 

Add changes to ethdev port and queue configuration based
on command line parameters for l3fwd graph application.

Signed-off-by: Nithin Dabilpuram 
---
 examples/l3fwd-graph/main.c | 350 +++-
 1 file changed, 349 insertions(+), 1 deletion(-)

diff --git a/examples/l3fwd-graph/main.c b/examples/l3fwd-graph/main.c
index ab6713488..7ea788589 100644
--- a/examples/l3fwd-graph/main.c
+++ b/examples/l3fwd-graph/main.c
@@ -20,8 +20,10 @@
 
 #include 
 #include 
+#include 
 #include 
 #include 
+#include 
 #include 
 #include 
 #include 
@@ -49,6 +51,10 @@
 
 #define NB_SOCKETS 8
 
+/* Static global variables used within this file. */
+static uint16_t nb_rxd = RTE_TEST_RX_DESC_DEFAULT;
+static uint16_t nb_txd = RTE_TEST_TX_DESC_DEFAULT;
+
 /**< Ports set in promiscuous mode off by default. */
 static int promiscuous_on;
 
@@ -60,6 +66,7 @@ static volatile bool force_quit;
 
 /* Ethernet addresses of ports */
 static uint64_t dest_eth_addr[RTE_MAX_ETHPORTS];
+static struct rte_ether_addr ports_eth_addr[RTE_MAX_ETHPORTS];
 xmm_t val_eth[RTE_MAX_ETHPORTS];
 
 /* Mask of enabled ports */
@@ -110,6 +117,8 @@ static struct rte_eth_conf port_conf = {
},
 };
 
+static struct rte_mempool *pktmbuf_pool[RTE_MAX_ETHPORTS][NB_SOCKETS];
+
 static int
 check_lcore_params(void)
 {
@@ -165,6 +174,27 @@ check_port_config(void)
return 0;
 }
 
+static uint8_t
+get_port_n_rx_queues(const uint16_t port)
+{
+   int queue = -1;
+   uint16_t i;
+
+   for (i = 0; i < nb_lcore_params; ++i) {
+   if (lcore_params[i].port_id == port) {
+   if (lcore_params[i].queue_id == queue + 1)
+   queue = lcore_params[i].queue_id;
+   else
+   rte_exit(EXIT_FAILURE,
+"Queue ids of the port %d must be"
+" in sequence and must start with 0\n",
+lcore_params[i].port_id);
+   }
+   }
+
+   return (uint8_t)(++queue);
+}
+
 static int
 init_lcore_rx_queues(void)
 {
@@ -479,6 +509,120 @@ parse_args(int argc, char **argv)
return ret;
 }
 
+static void
+print_ethaddr(const char *name, const struct rte_ether_addr *eth_addr)
+{
+   char buf[RTE_ETHER_ADDR_FMT_SIZE];
+   rte_ether_format_addr(buf, RTE_ETHER_ADDR_FMT_SIZE, eth_addr);
+   printf("%s%s", name, buf);
+}
+
+static int
+init_mem(uint16_t portid, uint32_t nb_mbuf)
+{
+   uint32_t lcore_id;
+   int socketid;
+   char s[64];
+
+   for (lcore_id = 0; lcore_id < RTE_MAX_LCORE; lcore_id++) {
+   if (rte_lcore_is_enabled(lcore_id) == 0)
+   continue;
+
+   if (numa_on)
+   socketid = rte_lcore_to_socket_id(lcore_id);
+   else
+   socketid = 0;
+
+   if (socketid >= NB_SOCKETS) {
+   rte_exit(EXIT_FAILURE,
+"Socket %d of lcore %u is out of range %d\n",
+socketid, lcore_id, NB_SOCKETS);
+   }
+
+   if (pktmbuf_pool[portid][socketid] == NULL) {
+   snprintf(s, sizeof(s), "mbuf_pool_%d:%d", portid,
+socketid);
+   /* Create a pool with priv size of a cacheline */
+   pktmbuf_pool[portid][socketid] =
+   rte_pktmbuf_pool_create(
+   s, nb_mbuf, MEMPOOL_CACHE_SIZE,
+   RTE_CACHE_LINE_SIZE,
+   RTE_MBUF_DEFAULT_BUF_SIZE, socketid);
+   if (pktmbuf_pool[portid][socketid] == NULL)
+   rte_exit(EXIT_FAILURE,
+"Cannot init mbuf pool on socket %d\n",
+socketid);
+   else
+   printf("Allocated mbuf pool on socket %d\n",
+  socketid);
+   }
+   }
+
+   return 0;
+}
+
+/* Check the link status of all ports in up to 9s, and print them finally */
+static void
+check_all_ports_link_status(uint32_t port_mask)
+{
+#define CHECK_INTERVAL 100 /* 100ms */
+#define MAX_CHECK_TIME 90  /* 9s (90 * 100ms) in total */
+   uint8_t count, all_ports_up, print_flag = 0;
+   struct rte_eth_link link;
+   uint16_t portid;
+
+   printf("\nChecking link status");
+   fflush(stdout);
+   for (count = 0; count <= MAX_CHECK_TIME; count++) {
+   if (force_quit)
+   return;
+   all_ports_up = 1;
+   RTE_ETH_FOREACH_DEV(portid)
+   {
+   if (force_quit)
+   return;
+   i

Re: [dpdk-dev] [PATCH dpdk-dev v2 1/2] eal: introduce rte-init queue for libraries initialization

2020-04-11 Thread Tonghao Zhang
On Fri, Apr 10, 2020 at 9:11 PM Jerin Jacob  wrote:
>
> On Fri, Apr 10, 2020 at 11:48 AM Jerin Jacob  wrote:
> >
>
> Three more items are missing in this patch
>
> 1) Unit test case for new API
> 2) Make the new API __rte_experimal
Hi Jerin
This API will be invoked in mempool, if use that prefix, there is a
compile warning:
include/rte_mempool.h:933:2: error: ‘rte_init_register’ is deprecated
(declared at x86_64-native-linuxapp-gcc/include/rte_init.h:61): Symbol
is not yet part of stable ABI [-Werror=deprecated-declarations]

remove the __rte_experimal in the patch 2?

> 3) Update the .map file
>
>
> > On Thu, Apr 9, 2020 at 8:33 PM  wrote:
> > >
> > > From: Tonghao Zhang 
> > >
> > > This patch introduces last-init queue, user can register a
> > > callback for theirs initialization. Running rte_last_init_run(),
> >
> > The above section needs to be rewritten wrt v2 changes.
> >
> > > the almost resource of DPDK are available, such as memzone, ring.
> > > With this way, user don't introduce additional codes in eal layer.
> > >
> > > [This patch will be used for next patch.]
> >
> > See below
> >
> >
> > >
> > > Signed-off-by: Tonghao Zhang 
> > > ---
> > See above
> >
> > Move [This patch will be used for next patch.] here to avoid
> > unnecessary information in the git commit.
> >
> > > v2:
> > > * rename rte_last_init_register ->rte_init_register
> > > * rename rte_last_init struct ->rte_init
> > > * rename rte_init_cb ->rte_init_cb_t
> > > * free the rte_init node when not used.
> > > * remove rte_init and others to eal_private.h
> > > * add comments
> > > * fix checkpatch warning
> > > ---
> > > diff --git a/lib/librte_eal/include/rte_init.h 
> > > b/lib/librte_eal/include/rte_init.h
> > > new file mode 100644
> > > index 000..636efff
> > > --- /dev/null
> > > +++ b/lib/librte_eal/include/rte_init.h
> > > @@ -0,0 +1,59 @@
> > > +/* SPDX-License-Identifier: BSD-3-Clause
> > > + * Copyright 2020 DPDK Community
> > > + */
> > > +
> > > +#ifndef _RTE_INIT_H_
> > > +#define _RTE_INIT_H_
> >
> > @file section is missing. See
> > lib/librte_eal/common/include/rte_errno.h as example.
> >
> >
> > > +#ifdef __cplusplus
> > > +extern "C" {
> > > +#endif
> > > +
> > > +#include 
> > > +#include 
> >
> >  is not required in public API header file.
> >
> > > +
> > > +/**
> > > + * Implementation specific callback function which is
> > > + * responsible for specificed initialization.
> > > + *
> > > + * This is called when almost resources are available.
> > > + *
> > > + * @return
> > > + * 0 for successful callback
> > > + * Negative for unsuccessful callback with error value
> > > + */
> > > +typedef int (*rte_init_cb_t)(const void *arg);
> > > +
> > > +/**
> > > + * rte_init type.
> > > + *
> > > + * The rte_init of RTE_INIT_PRE are called firstly,
> > > + * and then RTE_INIT_POST.
> > > + */
> > > +enum rte_init_type {
> > > +   RTE_INIT_PRE,
> >
> > Type specific comment is missing.
> >
> > Example as reference for formatting.
> >
> > /**
> >  * Enumerate trace mode operation.
> >  */
> > enum rte_trace_mode_e {
> > /**
> >  * In this mode, When no space left in trace buffer, the subsequent
> >  * events overwrite the old events in the trace buffer.
> >  */
> > RTE_TRACE_MODE_OVERWRITE,
> > /**
> >  * In this mode, When no space left on trace buffer, the subsequent
> >  * events shall not be recorded in the trace buffer.
> >  */
> > RTE_TRACE_MODE_DISCARD,
> > };
> >
> > > +   RTE_INIT_POST
> > > +};
> >
> >
> > > +
> > > +/**
> > > + * Register a rte_init callback.
> > > + *
> > > + * @param cb
> > > + *   A pointer to a rte_init_cb structure, which will be used
> >
> > s/used/invoked?
> >
> > > + *   in rte_eal_init().
> > > + *
> > > + * @param arg
> > > + *   The cb will use that as param.
> > > + *
> > > + * @param type
> > > + *   The type of rte_init registered.
> > > + */
> > > +
> > > +void rte_init_register(rte_init_cb_t cb, const void *arg,
> > > +  enum rte_init_type type);
> > > +
> > > +#ifdef __cplusplus
> > > +}
> > > +#endif
> > > +
> > > +#endif /* _RTE_INIT_H_ */



-- 
Best regards, Tonghao


Re: [dpdk-dev] [PATCH dpdk-dev v2 1/2] eal: introduce rte-init queue for libraries initialization

2020-04-11 Thread Tonghao Zhang
On Sun, Apr 12, 2020 at 11:20 AM Tonghao Zhang  wrote:
>
> On Fri, Apr 10, 2020 at 9:11 PM Jerin Jacob  wrote:
> >
> > On Fri, Apr 10, 2020 at 11:48 AM Jerin Jacob  wrote:
> > >
> >
> > Three more items are missing in this patch
Can I add "Co-authored-by" for you ?

> > 1) Unit test case for new API
> > 2) Make the new API __rte_experimal
> Hi Jerin
> This API will be invoked in mempool, if use that prefix, there is a
> compile warning:
> include/rte_mempool.h:933:2: error: ‘rte_init_register’ is deprecated
> (declared at x86_64-native-linuxapp-gcc/include/rte_init.h:61): Symbol
> is not yet part of stable ABI [-Werror=deprecated-declarations]
>
> remove the __rte_experimal in the patch 2?
>
> > 3) Update the .map file
> >
> >
> > > On Thu, Apr 9, 2020 at 8:33 PM  wrote:
> > > >
> > > > From: Tonghao Zhang 
> > > >
> > > > This patch introduces last-init queue, user can register a
> > > > callback for theirs initialization. Running rte_last_init_run(),
> > >
> > > The above section needs to be rewritten wrt v2 changes.
> > >
> > > > the almost resource of DPDK are available, such as memzone, ring.
> > > > With this way, user don't introduce additional codes in eal layer.
> > > >
> > > > [This patch will be used for next patch.]
> > >
> > > See below
> > >
> > >
> > > >
> > > > Signed-off-by: Tonghao Zhang 
> > > > ---
> > > See above
> > >
> > > Move [This patch will be used for next patch.] here to avoid
> > > unnecessary information in the git commit.
> > >
> > > > v2:
> > > > * rename rte_last_init_register ->rte_init_register
> > > > * rename rte_last_init struct ->rte_init
> > > > * rename rte_init_cb ->rte_init_cb_t
> > > > * free the rte_init node when not used.
> > > > * remove rte_init and others to eal_private.h
> > > > * add comments
> > > > * fix checkpatch warning
> > > > ---
> > > > diff --git a/lib/librte_eal/include/rte_init.h 
> > > > b/lib/librte_eal/include/rte_init.h
> > > > new file mode 100644
> > > > index 000..636efff
> > > > --- /dev/null
> > > > +++ b/lib/librte_eal/include/rte_init.h
> > > > @@ -0,0 +1,59 @@
> > > > +/* SPDX-License-Identifier: BSD-3-Clause
> > > > + * Copyright 2020 DPDK Community
> > > > + */
> > > > +
> > > > +#ifndef _RTE_INIT_H_
> > > > +#define _RTE_INIT_H_
> > >
> > > @file section is missing. See
> > > lib/librte_eal/common/include/rte_errno.h as example.
> > >
> > >
> > > > +#ifdef __cplusplus
> > > > +extern "C" {
> > > > +#endif
> > > > +
> > > > +#include 
> > > > +#include 
> > >
> > >  is not required in public API header file.
> > >
> > > > +
> > > > +/**
> > > > + * Implementation specific callback function which is
> > > > + * responsible for specificed initialization.
> > > > + *
> > > > + * This is called when almost resources are available.
> > > > + *
> > > > + * @return
> > > > + * 0 for successful callback
> > > > + * Negative for unsuccessful callback with error value
> > > > + */
> > > > +typedef int (*rte_init_cb_t)(const void *arg);
> > > > +
> > > > +/**
> > > > + * rte_init type.
> > > > + *
> > > > + * The rte_init of RTE_INIT_PRE are called firstly,
> > > > + * and then RTE_INIT_POST.
> > > > + */
> > > > +enum rte_init_type {
> > > > +   RTE_INIT_PRE,
> > >
> > > Type specific comment is missing.
> > >
> > > Example as reference for formatting.
> > >
> > > /**
> > >  * Enumerate trace mode operation.
> > >  */
> > > enum rte_trace_mode_e {
> > > /**
> > >  * In this mode, When no space left in trace buffer, the 
> > > subsequent
> > >  * events overwrite the old events in the trace buffer.
> > >  */
> > > RTE_TRACE_MODE_OVERWRITE,
> > > /**
> > >  * In this mode, When no space left on trace buffer, the 
> > > subsequent
> > >  * events shall not be recorded in the trace buffer.
> > >  */
> > > RTE_TRACE_MODE_DISCARD,
> > > };
> > >
> > > > +   RTE_INIT_POST
> > > > +};
> > >
> > >
> > > > +
> > > > +/**
> > > > + * Register a rte_init callback.
> > > > + *
> > > > + * @param cb
> > > > + *   A pointer to a rte_init_cb structure, which will be used
> > >
> > > s/used/invoked?
> > >
> > > > + *   in rte_eal_init().
> > > > + *
> > > > + * @param arg
> > > > + *   The cb will use that as param.
> > > > + *
> > > > + * @param type
> > > > + *   The type of rte_init registered.
> > > > + */
> > > > +
> > > > +void rte_init_register(rte_init_cb_t cb, const void *arg,
> > > > +  enum rte_init_type type);
> > > > +
> > > > +#ifdef __cplusplus
> > > > +}
> > > > +#endif
> > > > +
> > > > +#endif /* _RTE_INIT_H_ */
>
>
>
> --
> Best regards, Tonghao



-- 
Best regards, Tonghao