On Sun, Jul 19, 2020 at 12:09 PM Thomas Monjalon <tho...@monjalon.net> wrote: > > The detection of the CPU was done in a constructor and shared > in a global variable. > > This variable may not be visible in the net PMD > because it was not exported as part of the .map file. > It is fixed by exporting a function, which is cleaner than a variable. > > By checking the CPU only at the first call of the function, > doing the check in a constructor becomes useless. > Note: the priority of the constructor was probably irrelevant. > > At the same time, the comments are reworded or dropped if useless. > > Fixes: 4c204fe5e5d2 ("common/mlx5: disable relaxed ordering in unsuitable > CPUs") > Cc: shi...@mellanox.com > Cc: sta...@dpdk.org > > Signed-off-by: Thomas Monjalon <tho...@monjalon.net> > --- > drivers/common/mlx5/linux/mlx5_common_verbs.c | 2 +- > drivers/common/mlx5/mlx5_common.c | 53 ++++++++----------- > drivers/common/mlx5/mlx5_common.h | 4 +- > .../common/mlx5/rte_common_mlx5_version.map | 2 + > drivers/net/mlx5/mlx5_flow_dv.c | 2 +- > 5 files changed, 28 insertions(+), 35 deletions(-) > > diff --git a/drivers/common/mlx5/linux/mlx5_common_verbs.c > b/drivers/common/mlx5/linux/mlx5_common_verbs.c > index a2fc7a36bd..31ac20fe09 100644 > --- a/drivers/common/mlx5/linux/mlx5_common_verbs.c > +++ b/drivers/common/mlx5/linux/mlx5_common_verbs.c > @@ -55,7 +55,7 @@ mlx5_common_verbs_reg_mr(void *pd, void *addr, size_t > length, > memset(pmd_mr, 0, sizeof(*pmd_mr)); > ibv_mr = mlx5_glue->reg_mr(pd, addr, length, > IBV_ACCESS_LOCAL_WRITE | > - (haswell_broadwell_cpu ? 0 : > + (mlx5_cpu_is_haswell_broadwell() ? 
0 : > IBV_ACCESS_RELAXED_ORDERING)); > if (!ibv_mr) > return -1; > diff --git a/drivers/common/mlx5/mlx5_common.c > b/drivers/common/mlx5/mlx5_common.c > index 693e2c68c8..7232d5131d 100644 > --- a/drivers/common/mlx5/mlx5_common.c > +++ b/drivers/common/mlx5/mlx5_common.c > @@ -20,8 +20,6 @@ int mlx5_common_logtype; > const struct mlx5_glue *mlx5_glue; > #endif > > -uint8_t haswell_broadwell_cpu; > - > static int > mlx5_class_check_handler(__rte_unused const char *key, const char *value, > void *opaque) > @@ -59,19 +57,8 @@ mlx5_class_get(struct rte_devargs *devargs) > } > > > -/* In case this is an x86_64 intel processor to check if > - * we should use relaxed ordering. > - */ > #ifdef RTE_ARCH_X86_64 > -/** > - * This function returns processor identification and feature information > - * into the registers. > - * > - * @param eax, ebx, ecx, edx > - * Pointers to the registers that will hold cpu information. > - * @param level > - * The main category of information returned. > - */ > +/* Processor identification and feature information filled in registers. */
Nit, no need for inline. > static inline void mlx5_cpu_id(unsigned int level, > unsigned int *eax, unsigned int *ebx, > unsigned int *ecx, unsigned int *edx) > @@ -97,17 +84,7 @@ RTE_INIT_PRIO(mlx5_glue_init, CLASS) > mlx5_glue_constructor(); > } > > -/** > - * This function is responsible of initializing the variable > - * haswell_broadwell_cpu by checking if the cpu is intel > - * and reading the data returned from mlx5_cpu_id(). > - * since haswell and broadwell cpus don't have improved performance > - * when using relaxed ordering we want to check the cpu type before > - * before deciding whether to enable RO or not. > - * if the cpu is haswell or broadwell the variable will be set to 1 > - * otherwise it will be 0. > - */ > -RTE_INIT_PRIO(mlx5_is_haswell_broadwell_cpu, LOG) > +static bool mlx5_x86_is_haswell_broadwell(void) > { > #ifdef RTE_ARCH_X86_64 > unsigned int broadwell_models[4] = {0x3d, 0x47, 0x4F, 0x56}; > @@ -125,8 +102,7 @@ RTE_INIT_PRIO(mlx5_is_haswell_broadwell_cpu, LOG) > vendor = ebx; > max_level = eax; > if (max_level < 1) { > - haswell_broadwell_cpu = 0; > - return; > + return false; > } > mlx5_cpu_id(1, &eax, &ebx, &ecx, &edx); > model = (eax >> 4) & 0x0f; > @@ -140,18 +116,31 @@ RTE_INIT_PRIO(mlx5_is_haswell_broadwell_cpu, LOG) > if (brand_id == 0 && family == 0x6) { > for (i = 0; i < RTE_DIM(broadwell_models); i++) > if (model == broadwell_models[i]) { > - haswell_broadwell_cpu = 1; > - return; > + return true; > } > for (i = 0; i < RTE_DIM(haswell_models); i++) > if (model == haswell_models[i]) { > - haswell_broadwell_cpu = 1; > - return; > + return true; > } > } > } > #endif > - haswell_broadwell_cpu = 0; > + return false; > +} > + > +/* > + * Check if the CPU is Intel Haswell or Broadwell, > + * because PCI relaxed ordering has no performance benefit with these CPUs. 
> + */ > +bool mlx5_cpu_is_haswell_broadwell(void) > +{ > + static bool haswell_broadwell_cpu; > + static bool once = false; > + > + if (once) > + return haswell_broadwell_cpu; > + once = true; > + return haswell_broadwell_cpu = mlx5_x86_is_haswell_broadwell(); > } > > /** > diff --git a/drivers/common/mlx5/mlx5_common.h > b/drivers/common/mlx5/mlx5_common.h > index 2851507058..d453e0b3d8 100644 > --- a/drivers/common/mlx5/mlx5_common.h > +++ b/drivers/common/mlx5/mlx5_common.h > @@ -243,6 +243,9 @@ struct mlx5_klm { > > LIST_HEAD(mlx5_dbr_page_list, mlx5_devx_dbr_page); > > +__rte_internal > +bool mlx5_cpu_is_haswell_broadwell(void); > + > __rte_internal > enum mlx5_class mlx5_class_get(struct rte_devargs *devargs); > __rte_internal > @@ -255,6 +258,5 @@ int64_t mlx5_get_dbr(void *ctx, struct > mlx5_dbr_page_list *head, > __rte_internal > int32_t mlx5_release_dbr(struct mlx5_dbr_page_list *head, uint32_t umem_id, > uint64_t offset); > -extern uint8_t haswell_broadwell_cpu; > > #endif /* RTE_PMD_MLX5_COMMON_H_ */ > diff --git a/drivers/common/mlx5/rte_common_mlx5_version.map > b/drivers/common/mlx5/rte_common_mlx5_version.map > index ae57ebdba5..501b9fff3b 100644 > --- a/drivers/common/mlx5/rte_common_mlx5_version.map > +++ b/drivers/common/mlx5/rte_common_mlx5_version.map > @@ -6,6 +6,8 @@ INTERNAL { > mlx5_common_verbs_reg_mr; > mlx5_common_verbs_dereg_mr; > > + mlx5_cpu_is_haswell_broadwell; > + > mlx5_create_mr_ext; > > mlx5_dev_to_pci_addr; > diff --git a/drivers/net/mlx5/mlx5_flow_dv.c b/drivers/net/mlx5/mlx5_flow_dv.c > index 8b5b6838fa..f1109ae095 100644 > --- a/drivers/net/mlx5/mlx5_flow_dv.c > +++ b/drivers/net/mlx5/mlx5_flow_dv.c > @@ -4201,7 +4201,7 @@ flow_dv_create_counter_stat_mem_mng(struct rte_eth_dev > *dev, int raws_n) > mkey_attr.klm_num = 0; > if (priv->config.hca_attr.relaxed_ordering_write && > priv->config.hca_attr.relaxed_ordering_read && > - !haswell_broadwell_cpu) > + !mlx5_cpu_is_haswell_broadwell()) > mkey_attr.relaxed_ordering = 1; > 
mem_mng->dm = mlx5_devx_cmd_mkey_create(sh->ctx, &mkey_attr); > if (!mem_mng->dm) { > -- > 2.27.0 > I came across this constructor hack while looking at the common code. This patch makes sense. Reviewed-by: David Marchand <david.march...@redhat.com> -- David Marchand