On Fri, Jan 17, 2025 at 05:33:31PM -0700, Ahmed Zaki wrote:
> Add a new netdev flag "rx_cpu_rmap_auto". Drivers supporting ARFS should
> set the flag via netif_enable_cpu_rmap() and core will allocate and manage
> the ARFS rmap. Freeing the rmap is also done by core when the netdev is
> freed.
> 
> For better IRQ affinity management, move the IRQ rmap notifier inside the
> napi_struct. Consequently, add new notify.notify and notify.release
> functions: netif_irq_cpu_rmap_notify() and netif_napi_affinity_release().
> 
> Acked-by: David Arinzon <darin...@amazon.com>
> Signed-off-by: Ahmed Zaki <ahmed.z...@intel.com>

[...]

> diff --git a/net/core/dev.c b/net/core/dev.c
> index fe5f5855593d..dbb63005bc2b 100644
> --- a/net/core/dev.c
> +++ b/net/core/dev.c
> @@ -6862,6 +6862,141 @@ void netif_queue_set_napi(struct net_device *dev, 
> unsigned int queue_index,
>  }
>  EXPORT_SYMBOL(netif_queue_set_napi);
>  
> +#ifdef CONFIG_RFS_ACCEL
> +static void
> +netif_irq_cpu_rmap_notify(struct irq_affinity_notify *notify,
> +                       const cpumask_t *mask)
> +{
> +     struct napi_struct *napi =
> +             container_of(notify, struct napi_struct, notify);
> +     struct cpu_rmap *rmap = napi->dev->rx_cpu_rmap;
> +     int err;

I wonder if this generates a warning with some compilers? err is
defined not used if !napi->dev->rx_cpu_rmap_auto ? Not sure.

> +     if (napi->dev->rx_cpu_rmap_auto) {
> +             err = cpu_rmap_update(rmap, napi->napi_rmap_idx, mask);
> +             if (err)
> +                     pr_warn("%s: RMAP update failed (%d)\n",
> +                             __func__, err);
> +     }
> +}
> +
> +static void netif_napi_affinity_release(struct kref *ref)
> +{
> +     struct napi_struct *napi =
> +             container_of(ref, struct napi_struct, notify.kref);
> +     struct cpu_rmap *rmap = napi->dev->rx_cpu_rmap;
> +
> +     if (!napi->dev->rx_cpu_rmap_auto)
> +             return;
> +     rmap->obj[napi->napi_rmap_idx] = NULL;
> +     napi->napi_rmap_idx = -1;
> +     cpu_rmap_put(rmap);
> +}
> +
> +static int napi_irq_cpu_rmap_add(struct napi_struct *napi, int irq)
> +{
> +     struct cpu_rmap *rmap = napi->dev->rx_cpu_rmap;
> +     int rc;
> +
> +     if (!rmap)
> +             return -EINVAL;
> +
> +     napi->notify.notify = netif_irq_cpu_rmap_notify;
> +     napi->notify.release = netif_napi_affinity_release;

Maybe the callbacks should only be set at the end after everything
else is successful, just before the return 0 ?

> +     cpu_rmap_get(rmap);
> +     rc = cpu_rmap_add(rmap, napi);
> +     if (rc < 0)
> +             goto err_add;
> +
> +     napi->napi_rmap_idx = rc;
> +     rc = irq_set_affinity_notifier(irq, &napi->notify);
> +     if (rc)
> +             goto err_set;
> +
> +     return 0;
> +
> +err_set:
> +     rmap->obj[napi->napi_rmap_idx] = NULL;
> +     napi->napi_rmap_idx = -1;
> +err_add:
> +     cpu_rmap_put(rmap);
> +     return rc;
> +}

[...]

> +void netif_napi_set_irq_locked(struct napi_struct *napi, int irq)
> +{
> +     int rc;
> +
> +     if (!napi->dev->rx_cpu_rmap_auto)
> +             goto out;

Maybe the above if statement could be extended to be something like:

if (!napi->dev->rx_cpu_rmap_auto || napi->irq < 0)
  goto out;

then you can omit the irq > 0 checks in the code below, potentially?

> +     /* Remove existing rmap entries */
> +     if (napi->irq != irq && napi->irq > 0)
> +             irq_set_affinity_notifier(napi->irq, NULL);
> +
> +     if (irq > 0) {
> +             rc = napi_irq_cpu_rmap_add(napi, irq);
> +             if (rc) {
> +                     netdev_warn(napi->dev, "Unable to update ARFS map 
> (%d)\n",
> +                                 rc);
> +                     netif_disable_cpu_rmap(napi->dev);
> +             }
> +     }
> +
> +out:
> +     napi->irq = irq;
> +}
> +EXPORT_SYMBOL(netif_napi_set_irq_locked);
> +

Reply via email to