On Thu, Apr 25, 2024 at 07:11:30PM +0800, Jianyue Wu wrote:
> From: Jianyue Wu <jianyue...@nokia-sbell.com>
> 
> Improve the robustness of setting thread affinity in DPDK
> by adding detailed error logging.
> 
> Changes:
> 1. Check the return value of pthread_setaffinity_np() and log an error
> if the call fails.
> 2. Include the current thread name, the intended CPU set, and a detailed
> error message in the log.
> 
> Sample prints:
> EAL: Cannot set affinity for thread dpdk-test with cpus 0,
> ret: 22, errno: 0, error description: Success
> EAL: Cannot set affinity for thread dpdk-worker1 with cpus 1,
> ret: 22, errno: 0, error description: Success
> 
> Signed-off-by: Jianyue Wu <jianyue...@nokia-sbell.com>
> ---
>  lib/eal/common/eal_common_thread.c |  2 +-
>  lib/eal/common/eal_thread.h        |  2 +-
>  lib/eal/unix/rte_thread.c          | 27 +++++++++++++++++++++++++--
>  3 files changed, 27 insertions(+), 4 deletions(-)
> 
> diff --git a/lib/eal/common/eal_common_thread.c b/lib/eal/common/eal_common_thread.c
> index a53bc639ae..31a2fab2a7 100644
> --- a/lib/eal/common/eal_common_thread.c
> +++ b/lib/eal/common/eal_common_thread.c
> @@ -103,7 +103,7 @@ rte_thread_get_affinity(rte_cpuset_t *cpusetp)
>  }
>  
>  int
> -eal_thread_dump_affinity(rte_cpuset_t *cpuset, char *str, unsigned int size)
> +eal_thread_dump_affinity(const rte_cpuset_t *cpuset, char *str, unsigned int size)
>  {
>       unsigned cpu;
>       int ret;
> diff --git a/lib/eal/common/eal_thread.h b/lib/eal/common/eal_thread.h
> index 1c3c3442d3..85ab84baa5 100644
> --- a/lib/eal/common/eal_thread.h
> +++ b/lib/eal/common/eal_thread.h
> @@ -50,7 +50,7 @@ unsigned eal_cpu_socket_id(unsigned cpu_id);
>   *   0 for success, -1 if truncation happens.
>   */
>  int
> -eal_thread_dump_affinity(rte_cpuset_t *cpuset, char *str, unsigned int size);
> +eal_thread_dump_affinity(const rte_cpuset_t *cpuset, char *str, unsigned int size);

No objection to adding const.

>  
>  /**
>   * Dump the current thread cpuset.
> diff --git a/lib/eal/unix/rte_thread.c b/lib/eal/unix/rte_thread.c
> index 1b4c73f58e..34ac0eabbf 100644
> --- a/lib/eal/unix/rte_thread.c
> +++ b/lib/eal/unix/rte_thread.c
> @@ -369,8 +369,31 @@ int
>  rte_thread_set_affinity_by_id(rte_thread_t thread_id,
>               const rte_cpuset_t *cpuset)
>  {
> -     return pthread_setaffinity_np((pthread_t)thread_id.opaque_id,
> -             sizeof(*cpuset), cpuset);
> +     int ret;
> +#if defined(__linux__) && defined(_GNU_SOURCE)
> +     char cpus_str[RTE_CPU_AFFINITY_STR_LEN] = {'\0'};
> +     char thread_name[RTE_MAX_THREAD_NAME_LEN] = {'\0'};
> +     errno = 0;
> +#endif
> +
> +     ret = pthread_setaffinity_np((pthread_t)thread_id.opaque_id,
> +                             sizeof(*cpuset), cpuset);
> +
> +#if defined(__linux__) && defined(_GNU_SOURCE)
> +     if (ret != 0) {
> +             if (pthread_getname_np((pthread_t)thread_id.opaque_id,
> +                                     thread_name, sizeof(thread_name)) != 0)
> +                     EAL_LOG(ERR, "pthread_getname_np failed!");
> +             if (eal_thread_dump_affinity(cpuset, cpus_str, RTE_CPU_AFFINITY_STR_LEN) != 0)
> +                     EAL_LOG(ERR, "eal_thread_dump_affinity failed!");
> +             EAL_LOG(ERR, "Cannot set affinity for thread %s with cpus %s, "
> +                     "ret: %d, errno: %d, error description: %s",
> +                     thread_name, cpus_str,
> +                     ret, errno, strerror(errno));
> +     }
> +#endif
> +
> +     return ret;
>  }
>  
>  int
> -- 

I do not think introducing OS-specific behavior/logging to the EAL
is a good idea. Logging, although not formally part of the API surface,
should present the same experience on all platforms. The EAL should
be held to a higher standard here.

> 2.34.1

Reply via email to