Thanks for working on this.

On Wed, Sep 25, 2019 at 6:10 PM Stephen Hemminger
<step...@networkplumber.org> wrote:
>
> The internal structure of lcore_config is no longer part of the
> visible API/ABI. Make it private to EAL.
>
> Rearrange and resize the fields in the structure so it takes
> less memory (and cache footprint).

This patch is missing the release notes update.


>
> Signed-off-by: Stephen Hemminger <step...@networkplumber.org>
> ---
> v7 - add eal_private.h to windows
>
>  lib/librte_eal/common/eal_common_launch.c |  2 ++
>  lib/librte_eal/common/eal_private.h       | 22 +++++++++++++++++++++
>  lib/librte_eal/common/include/rte_lcore.h | 24 -----------------------
>  lib/librte_eal/common/rte_service.c       |  2 ++
>  lib/librte_eal/rte_eal_version.map        |  1 -
>  lib/librte_eal/windows/eal/eal_thread.c   |  1 +
>  6 files changed, 27 insertions(+), 25 deletions(-)
>
> diff --git a/lib/librte_eal/common/eal_common_launch.c 
> b/lib/librte_eal/common/eal_common_launch.c
> index fe0ba3f0d617..cf52d717f68e 100644
> --- a/lib/librte_eal/common/eal_common_launch.c
> +++ b/lib/librte_eal/common/eal_common_launch.c
> @@ -15,6 +15,8 @@
>  #include <rte_per_lcore.h>
>  #include <rte_lcore.h>
>
> +#include "eal_private.h"
> +
>  /*
>   * Wait until a lcore finished its job.
>   */
> diff --git a/lib/librte_eal/common/eal_private.h 
> b/lib/librte_eal/common/eal_private.h
> index 798ede553b21..25e80547904f 100644
> --- a/lib/librte_eal/common/eal_private.h
> +++ b/lib/librte_eal/common/eal_private.h
> @@ -10,6 +10,28 @@
>  #include <stdio.h>
>
>  #include <rte_dev.h>
> +#include <rte_lcore.h>
> +
> +/**
> + * Structure storing internal configuration (per-lcore)
> + */
> +struct lcore_config {
> +       uint32_t core_id;      /**< core number on socket for this lcore */
> +       uint32_t core_index;   /**< relative index, starting from 0 */
> +       uint16_t socket_id;    /**< physical socket id for this lcore */
> +       uint8_t core_role;         /**< role of core eg: OFF, RTE, SERVICE */
> +       uint8_t detected;          /**< true if lcore was detected */
> +       volatile enum rte_lcore_state_t state; /**< lcore state */
> +       rte_cpuset_t cpuset;       /**< cpu set which the lcore affinity to */
> +       pthread_t thread_id;       /**< pthread identifier */
> +       int pipe_master2slave[2];  /**< communication pipe with master */
> +       int pipe_slave2master[2];  /**< communication pipe with master */
> +       lcore_function_t * volatile f;         /**< function to call */
> +       void * volatile arg;       /**< argument of function */
> +       volatile int ret;          /**< return value of function */
> +};
> +
> +extern struct lcore_config lcore_config[RTE_MAX_LCORE];

Everything but cpuset can fit in a cache line.
You could just move the cpuset field to the end of the structure and
change detected to uint8_t.
This gives the following layout:

struct lcore_config {
    pthread_t                  thread_id;            /*     0     8 */
    int                        pipe_master2slave[2]; /*     8     8 */
    int                        pipe_slave2master[2]; /*    16     8 */
    volatile lcore_function_t *  f;                  /*    24     8 */
    volatile void *            arg;                  /*    32     8 */
    volatile int               ret;                  /*    40     4 */
    volatile enum rte_lcore_state_t  state;          /*    44     4 */
    unsigned int               socket_id;            /*    48     4 */
    unsigned int               core_id;              /*    52     4 */
    int                        core_index;           /*    56     4 */
    uint8_t                    detected;             /*    60     1 */
    uint8_t                    core_role;            /*    61     1 */

    /* XXX 2 bytes hole, try to pack */

    /* --- cacheline 1 boundary (64 bytes) --- */
    rte_cpuset_t               cpuset;               /*    64   128 */
    /* --- cacheline 3 boundary (192 bytes) --- */

    /* size: 192, cachelines: 3, members: 13 */
    /* sum members: 190, holes: 1, sum holes: 2 */
};

The resulting structure is only two bytes bigger than your proposal
and does not touch existing integer types (avoiding, for example, the
risk of an unintended integer conversion on socket_id).


-- 
David Marchand

Reply via email to