[dpdk-dev] [PATCH v5] eal: add generic thread-local-storage functions

2020-12-26 Thread Tal Shnaiderman
Add support for tls functionality in EAL.

The following functions are added:
rte_thread_tls_create_key - function to create a tls data key.
rte_thread_tls_delete_key - function to delete a tls data key.
rte_thread_tls_set_value - function to set value bound to the tls key
rte_thread_tls_get_value - function to get value bound to the tls key

tls key will be defined by the new type rte_tls_key

Windows implementation is under librte_eal/windows and
implemented using WIN32 API for Windows only.

common implementation is under librte_eal/common and
implemented using pthread for UNIX and Windows compilation
using extenral pthread libraries, when supported.

Signed-off-by: Tal Shnaiderman 
---
v3: switch from pthread shim to generic eal implementation [DmitryK]
v4: modify file names, function names, move unix code to common
for future external pthreads support [DmitryK]
v5: rename var used for extenal pthreads, add description in
meson_options.txt. [DmitryK]
---
 lib/librte_eal/common/meson.build   |  1 +
 lib/librte_eal/common/rte_thread.c  | 86 
 lib/librte_eal/include/meson.build  |  1 +
 lib/librte_eal/include/rte_thread.h | 88 +
 lib/librte_eal/rte_eal_exports.def  |  5 +++
 lib/librte_eal/version.map  |  6 +++
 lib/librte_eal/windows/meson.build  |  6 +++
 lib/librte_eal/windows/rte_thread.c | 82 ++
 meson_options.txt   |  2 +
 9 files changed, 277 insertions(+)
 create mode 100644 lib/librte_eal/common/rte_thread.c
 create mode 100644 lib/librte_eal/include/rte_thread.h
 create mode 100644 lib/librte_eal/windows/rte_thread.c

diff --git a/lib/librte_eal/common/meson.build 
b/lib/librte_eal/common/meson.build
index 39abf7a0a4..69c88b3349 100644
--- a/lib/librte_eal/common/meson.build
+++ b/lib/librte_eal/common/meson.build
@@ -77,6 +77,7 @@ sources += files(
'rte_random.c',
'rte_reciprocal.c',
'rte_service.c',
+   'rte_thread.c',
 )
 
 if is_linux
diff --git a/lib/librte_eal/common/rte_thread.c 
b/lib/librte_eal/common/rte_thread.c
new file mode 100644
index 00..56a182d1f1
--- /dev/null
+++ b/lib/librte_eal/common/rte_thread.c
@@ -0,0 +1,86 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright 2020 Mellanox Technologies, Ltd
+ */
+
+#include 
+#include 
+#include 
+#include 
+
+#include 
+#include 
+#include 
+#include 
+
+struct eal_tls_key {
+   pthread_key_t thread_index;
+};
+
+int
+rte_thread_tls_create_key(rte_tls_key *key, void (*destructor)(void *))
+{
+   int err;
+
+   *key = malloc(sizeof(struct eal_tls_key));
+   if ((*key) == NULL) {
+   RTE_LOG(DEBUG, EAL, "Cannot allocate tls key.");
+   return -1;
+   }
+   err = pthread_key_create(&((*key)->thread_index), destructor);
+   if (err) {
+   RTE_LOG(DEBUG, EAL, "pthread_key_create failed: %s\n",
+strerror(err));
+   free(*key);
+   return -1;
+   }
+   return 0;
+}
+
+int
+rte_thread_tls_delete_key(rte_tls_key key)
+{
+   int err;
+
+   if (!key) {
+   RTE_LOG(DEBUG, EAL, "invalid tls key passed to function.\n");
+   return -1;
+   }
+   err = pthread_key_delete(key->thread_index);
+   if (err) {
+   RTE_LOG(DEBUG, EAL, "pthread_key_delete failed: %s\n",
+strerror(err));
+   free(key);
+   return -1;
+   }
+   free(key);
+   return 0;
+}
+
+int
+rte_thread_tls_set_value(rte_tls_key key, const void *value)
+{
+   int err;
+
+   if (!key) {
+   RTE_LOG(DEBUG, EAL, "invalid tls key passed to function.\n");
+   return -1;
+   }
+   err = pthread_setspecific(key->thread_index, value);
+   if (err) {
+   RTE_LOG(DEBUG, EAL, "pthread_setspecific failed: %s\n",
+   strerror(err));
+   return -1;
+   }
+   return 0;
+}
+
+void *
+rte_thread_tls_get_value(rte_tls_key key)
+{
+   if (!key) {
+   RTE_LOG(DEBUG, EAL, "invalid tls key passed to function.\n");
+   rte_errno = EINVAL;
+   return NULL;
+   }
+   return pthread_getspecific(key->thread_index);
+}
diff --git a/lib/librte_eal/include/meson.build 
b/lib/librte_eal/include/meson.build
index dc007084ff..0dea342e1d 100644
--- a/lib/librte_eal/include/meson.build
+++ b/lib/librte_eal/include/meson.build
@@ -40,6 +40,7 @@ headers += files(
'rte_service_component.h',
'rte_string_fns.h',
'rte_tailq.h',
+   'rte_thread.h',
'rte_time.h',
'rte_trace.h',
'rte_trace_point.h',
diff --git a/lib/librte_eal/include/rte_thread.h 
b/lib/librte_eal/include/rte_thread.h
new file mode 100644
index 00..d1206586a5
--- /dev/null
+++ b/lib/librte_eal/include/rte_thread.h
@@ -0,0 +1,88 @@
+/* SPDX-License-Identifier: BSD-3-Cl

[dpdk-dev] [PATCH] mlx5: split multi-threaded flows per OS

2020-12-26 Thread Tal Shnaiderman
multi-threaded flows feature uses pthread function pthread_key_create
but for Windows the destruction option in the function is unimplemented.

to resolve it Windows will implement destruction mechanism to cleanup
mlx5_flow_workspace object for each terminated thread.

Linux flow will keep the current behavior.

Signed-off-by: Tal Shnaiderman 
Acked-by: Matan Azrad 
---
Depends-on: patch-85737 ("eal: add generic thread-local-storage functions")
---
 drivers/net/mlx5/linux/meson.build  |   1 +
 drivers/net/mlx5/linux/mlx5_flow_os.c   |  39 +++
 drivers/net/mlx5/mlx5.c |   8 ++
 drivers/net/mlx5/mlx5_flow.c|  29 +-
 drivers/net/mlx5/mlx5_flow.h|  10 ++
 drivers/net/mlx5/windows/mlx5_flow_os.c | 174 
 6 files changed, 237 insertions(+), 24 deletions(-)
 create mode 100644 drivers/net/mlx5/linux/mlx5_flow_os.c

diff --git a/drivers/net/mlx5/linux/meson.build 
b/drivers/net/mlx5/linux/meson.build
index 6c4402169e..8412edce78 100644
--- a/drivers/net/mlx5/linux/meson.build
+++ b/drivers/net/mlx5/linux/meson.build
@@ -9,5 +9,6 @@ sources += files(
'mlx5_verbs.c',
'mlx5_mp_os.c',
'mlx5_vlan_os.c',
+   'mlx5_flow_os.c',
 )
 
diff --git a/drivers/net/mlx5/linux/mlx5_flow_os.c 
b/drivers/net/mlx5/linux/mlx5_flow_os.c
new file mode 100644
index 00..9e98966c38
--- /dev/null
+++ b/drivers/net/mlx5/linux/mlx5_flow_os.c
@@ -0,0 +1,39 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright 2020 Mellanox Technologies, Ltd
+ */
+
+#include "mlx5_flow_os.h"
+
+#include 
+
+/* Key of thread specific flow workspace data. */
+static rte_tls_key key_workspace;
+
+int
+mlx5_flow_os_init_workspace_once(void)
+{
+   if (rte_thread_tls_create_key(&key_workspace, flow_release_workspace)) {
+   DRV_LOG(ERR, "Can't create flow workspace data thread key.");
+   return ENOMEM;
+   }
+   return 0;
+}
+
+void *
+mlx5_flow_os_get_specific_workspace(void)
+{
+   return rte_thread_tls_get_value(key_workspace);
+}
+
+int
+mlx5_flow_os_set_specific_workspace(struct mlx5_flow_workspace *data)
+{
+   return rte_thread_tls_set_value(key_workspace, data);
+}
+
+void
+mlx5_flow_os_release_workspace(void)
+{
+   rte_thread_tls_delete_key(key_workspace);
+}
+
diff --git a/drivers/net/mlx5/mlx5.c b/drivers/net/mlx5/mlx5.c
index 2aa269b13e..0fdcd0fe8d 100644
--- a/drivers/net/mlx5/mlx5.c
+++ b/drivers/net/mlx5/mlx5.c
@@ -1004,6 +1004,11 @@ mlx5_alloc_shared_dev_ctx(const struct 
mlx5_dev_spawn_data *spawn,
err = rte_errno;
goto error;
}
+   if (LIST_EMPTY(&mlx5_dev_ctx_list)) {
+   err = mlx5_flow_os_init_workspace_once();
+   if (err)
+   goto error;
+   }
mlx5_flow_aging_init(sh);
mlx5_flow_counters_mng_init(sh);
mlx5_flow_ipool_create(sh, config);
@@ -1079,6 +1084,9 @@ mlx5_free_shared_dev_ctx(struct mlx5_dev_ctx_shared *sh)
mlx5_mr_release_cache(&sh->share_cache);
/* Remove context from the global device list. */
LIST_REMOVE(sh, next);
+   /* Release flow workspaces objects on the last device. */
+   if (LIST_EMPTY(&mlx5_dev_ctx_list))
+   mlx5_flow_os_release_workspace();
pthread_mutex_unlock(&mlx5_dev_ctx_list_mutex);
/*
 *  Ensure there is no async event handler installed.
diff --git a/drivers/net/mlx5/mlx5_flow.c b/drivers/net/mlx5/mlx5_flow.c
index f110c6b714..a2a294eac2 100644
--- a/drivers/net/mlx5/mlx5_flow.c
+++ b/drivers/net/mlx5/mlx5_flow.c
@@ -696,11 +696,6 @@ static struct mlx5_flow_tunnel_info tunnels_info[] = {
},
 };
 
-/* Key of thread specific flow workspace data. */
-static pthread_key_t key_workspace;
-
-/* Thread specific flow workspace data once initialization data. */
-static pthread_once_t key_workspace_init;
 
 
 /**
@@ -5698,7 +5693,7 @@ mlx5_flow_start_default(struct rte_eth_dev *dev)
 /**
  * Release key of thread specific flow workspace data.
  */
-static void
+void
 flow_release_workspace(void *data)
 {
struct mlx5_flow_workspace *wks = data;
@@ -5712,16 +5707,6 @@ flow_release_workspace(void *data)
}
 }
 
-/**
- * Initialize key of thread specific flow workspace data.
- */
-static void
-flow_alloc_workspace(void)
-{
-   if (pthread_key_create(&key_workspace, flow_release_workspace))
-   DRV_LOG(ERR, "Can't create flow workspace data thread key.");
-}
-
 /**
  * Get thread specific current flow workspace.
  *
@@ -5732,7 +5717,7 @@ mlx5_flow_get_thread_workspace(void)
 {
struct mlx5_flow_workspace *data;
 
-   data = pthread_getspecific(key_workspace);
+   data = mlx5_flow_os_get_specific_workspace();
MLX5_ASSERT(data && data->inuse);
if (!data || !data->inuse)
DRV_LOG(ERR, "flow workspace not initialized.");
@@ -5780,11 +5765,7 @@ mlx5_flow_push_thread_workspace(void)
struct mlx

[dpdk-dev] [PATCH 1/2] pdump: use rte_pktmbuf_free bulk

2020-12-26 Thread Stephen Hemminger
Use rte_pktmbuf_free_bulk instead of loop when freeing
packets.

Signed-off-by: Stephen Hemminger 
---
 app/pdump/main.c | 8 
 lib/librte_pdump/rte_pdump.c | 6 +++---
 2 files changed, 7 insertions(+), 7 deletions(-)

diff --git a/app/pdump/main.c b/app/pdump/main.c
index b34bf335317b..f986c7e9d67e 100644
--- a/app/pdump/main.c
+++ b/app/pdump/main.c
@@ -477,10 +477,10 @@ pdump_rxtx(struct rte_ring *ring, uint16_t vdev_id, 
struct pdump_stats *stats)
stats->tx_pkts += nb_in_txd;
 
if (unlikely(nb_in_txd < nb_in_deq)) {
-   do {
-   rte_pktmbuf_free(rxtx_bufs[nb_in_txd]);
-   stats->freed_pkts++;
-   } while (++nb_in_txd < nb_in_deq);
+   unsigned int drops = nb_in_deq - nb_in_txd;
+
+   rte_pktmbuf_free_bulk(&rxtx_bufs[nb_in_txd], drops);
+   stats->freed_pkts += drops;;
}
}
 }
diff --git a/lib/librte_pdump/rte_pdump.c b/lib/librte_pdump/rte_pdump.c
index b3c8d5ce4384..3c11bd795bc1 100644
--- a/lib/librte_pdump/rte_pdump.c
+++ b/lib/librte_pdump/rte_pdump.c
@@ -93,11 +93,11 @@ pdump_copy(struct rte_mbuf **pkts, uint16_t nb_pkts, void 
*user_params)
 
ring_enq = rte_ring_enqueue_burst(ring, (void *)dup_bufs, d_pkts, NULL);
if (unlikely(ring_enq < d_pkts)) {
+   unsigned int drops = d_pkts - ring_enq;
+
PDUMP_LOG(DEBUG,
"only %d of packets enqueued to ring\n", ring_enq);
-   do {
-   rte_pktmbuf_free(dup_bufs[ring_enq]);
-   } while (++ring_enq < d_pkts);
+   rte_pktmbuf_free_bulk(&dup_bufs[ring_enq], drops);
}
 }
 
-- 
2.29.2



[dpdk-dev] [PATCH 2/2] pdump: replace DEVICE_ID_SIZE with RTE_DEV_NAME_MAX_LEN

2020-12-26 Thread Stephen Hemminger
The device string has an existing size in rte_dev.h
use that instead of defining our own.

Signed-off-by: Stephen Hemminger 
---
 lib/librte_pdump/rte_pdump.c | 13 +
 1 file changed, 5 insertions(+), 8 deletions(-)

diff --git a/lib/librte_pdump/rte_pdump.c b/lib/librte_pdump/rte_pdump.c
index 3c11bd795bc1..14a392ef0340 100644
--- a/lib/librte_pdump/rte_pdump.c
+++ b/lib/librte_pdump/rte_pdump.c
@@ -12,8 +12,6 @@
 
 #include "rte_pdump.h"
 
-#define DEVICE_ID_SIZE 64
-
 RTE_LOG_REGISTER(pdump_logtype, lib.pdump, NOTICE);
 
 /* Macro for printing using RTE_LOG */
@@ -39,14 +37,14 @@ struct pdump_request {
uint32_t flags;
union pdump_data {
struct enable_v1 {
-   char device[DEVICE_ID_SIZE];
+   char device[RTE_DEV_NAME_MAX_LEN];
uint16_t queue;
struct rte_ring *ring;
struct rte_mempool *mp;
void *filter;
} en_v1;
struct disable_v1 {
-   char device[DEVICE_ID_SIZE];
+   char device[RTE_DEV_NAME_MAX_LEN];
uint16_t queue;
struct rte_ring *ring;
struct rte_mempool *mp;
@@ -485,9 +483,8 @@ rte_pdump_enable(uint16_t port, uint16_t queue, uint32_t 
flags,
struct rte_mempool *mp,
void *filter)
 {
-
-   int ret = 0;
-   char name[DEVICE_ID_SIZE];
+   int ret;
+   char name[RTE_DEV_NAME_MAX_LEN];
 
ret = pdump_validate_port(port, name);
if (ret < 0)
@@ -531,7 +528,7 @@ int
 rte_pdump_disable(uint16_t port, uint16_t queue, uint32_t flags)
 {
int ret = 0;
-   char name[DEVICE_ID_SIZE];
+   char name[RTE_DEV_NAME_MAX_LEN];
 
ret = pdump_validate_port(port, name);
if (ret < 0)
-- 
2.29.2