Hi, Yotam

On 2017/9/25 13:38, Yotam Gigi wrote:
> On 09/25/2017 04:19 AM, Yunsheng Lin wrote:
>> Hi, Jiri
>>
>> On 2017/9/25 1:22, Jiri Pirko wrote:
>>> From: Yotam Gigi <yot...@mellanox.com>
>>>
>>> Make the ipmr module register as a FIB notifier. To do that, implement both
>>> the ipmr_seq_read and ipmr_dump ops.
>>>
>>> The ipmr_seq_read op returns a sequence counter that is incremented on
>>> every notification related operation done by the ipmr. To implement that,
>>> add a sequence counter in the netns_ipv4 struct and increment it whenever a
>>> new MFC route or VIF are added or deleted. The sequence operations are
>>> protected by the RTNL lock.
>>>
>>> The ipmr_dump iterates the list of MFC routes and the list of VIF entries
>>> and sends notifications about them. The entries dump is done under RCU
>>> where the VIF dump uses the mrt_lock too, as the vif->dev field can change
>>> under RCU.
>>>
>>> Signed-off-by: Yotam Gigi <yot...@mellanox.com>
>>> Reviewed-by: Ido Schimmel <ido...@mellanox.com>
>>> Signed-off-by: Jiri Pirko <j...@mellanox.com>
>>> ---
>>> v1->v2:
>>>  - Take the mrt_lock when dumping VIF entries.
>>> ---
>>>  include/linux/mroute.h   |  15 ++++++
>>>  include/net/netns/ipv4.h |   3 ++
>>>  net/ipv4/ipmr.c          | 137 
>>> ++++++++++++++++++++++++++++++++++++++++++++++-
>>>  3 files changed, 153 insertions(+), 2 deletions(-)
>>>
>>> diff --git a/include/linux/mroute.h b/include/linux/mroute.h
>>> index 10028f2..54c5cb8 100644
>>> --- a/include/linux/mroute.h
>>> +++ b/include/linux/mroute.h
>>> @@ -5,6 +5,7 @@
>>>  #include <linux/pim.h>
>>>  #include <linux/rhashtable.h>
>>>  #include <net/sock.h>
>>> +#include <net/fib_notifier.h>
>>>  #include <uapi/linux/mroute.h>
>>>  
>>>  #ifdef CONFIG_IP_MROUTE
>>> @@ -58,6 +59,14 @@ struct vif_device {
>>>     int             link;                   /* Physical interface index     
>>> */
>>>  };
>>>  
>>> +struct vif_entry_notifier_info {
>>> +   struct fib_notifier_info info;
>>> +   struct net_device *dev;
>>> +   vifi_t vif_index;
>>> +   unsigned short vif_flags;
>>> +   u32 tb_id;
>>> +};
>>> +
>>>  #define VIFF_STATIC 0x8000
>>>  
>>>  #define VIF_EXISTS(_mrt, _idx) ((_mrt)->vif_table[_idx].dev != NULL)
>>> @@ -146,6 +155,12 @@ struct mfc_cache {
>>>     struct rcu_head rcu;
>>>  };
>>>  
>>> +struct mfc_entry_notifier_info {
>>> +   struct fib_notifier_info info;
>>> +   struct mfc_cache *mfc;
>>> +   u32 tb_id;
>>> +};
>>> +
>>>  struct rtmsg;
>>>  int ipmr_get_route(struct net *net, struct sk_buff *skb,
>>>                __be32 saddr, __be32 daddr,
>>> diff --git a/include/net/netns/ipv4.h b/include/net/netns/ipv4.h
>>> index 8387f09..abc84d9 100644
>>> --- a/include/net/netns/ipv4.h
>>> +++ b/include/net/netns/ipv4.h
>>> @@ -163,6 +163,9 @@ struct netns_ipv4 {
>>>     struct fib_notifier_ops *notifier_ops;
>>>     unsigned int    fib_seq;        /* protected by rtnl_mutex */
>>>  
>>> +   struct fib_notifier_ops *ipmr_notifier_ops;
>> Can we add a const here?
> 
> It cannot be const, as it gets initialized in ipmr_notifier_init.
> 
>>
>>> +   unsigned int    ipmr_seq;       /* protected by rtnl_mutex */
>>> +
>>>     atomic_t        rt_genid;
>>>  };
>>>  #endif
>>> diff --git a/net/ipv4/ipmr.c b/net/ipv4/ipmr.c
>>> index 86dc5f9..49879c3 100644
>>> --- a/net/ipv4/ipmr.c
>>> +++ b/net/ipv4/ipmr.c
>>> @@ -264,6 +264,16 @@ static void __net_exit ipmr_rules_exit(struct net *net)
>>>     fib_rules_unregister(net->ipv4.mr_rules_ops);
>>>     rtnl_unlock();
>>>  }
>>> +
>>> +static int ipmr_rules_dump(struct net *net, struct notifier_block *nb)
>>> +{
>>> +   return fib_rules_dump(net, nb, RTNL_FAMILY_IPMR);
>>> +}
>>> +
>>> +static unsigned int ipmr_rules_seq_read(struct net *net)
>>> +{
>>> +   return fib_rules_seq_read(net, RTNL_FAMILY_IPMR);
>>> +}
>>>  #else
>>>  #define ipmr_for_each_table(mrt, net) \
>>>     for (mrt = net->ipv4.mrt; mrt; mrt = NULL)
>>> @@ -298,6 +308,16 @@ static void __net_exit ipmr_rules_exit(struct net *net)
>>>     net->ipv4.mrt = NULL;
>>>     rtnl_unlock();
>>>  }
>>> +
>>> +static int ipmr_rules_dump(struct net *net, struct notifier_block *nb)
>>> +{
>>> +   return 0;
>>> +}
>>> +
>>> +static unsigned int ipmr_rules_seq_read(struct net *net)
>>> +{
>>> +   return 0;
>>> +}
>>>  #endif
>>>  
>>>  static inline int ipmr_hash_cmp(struct rhashtable_compare_arg *arg,
>>> @@ -587,6 +607,43 @@ static struct net_device *ipmr_reg_vif(struct net 
>>> *net, struct mr_table *mrt)
>>>  }
>>>  #endif
>>>  
>>> +static int call_ipmr_vif_entry_notifier(struct notifier_block *nb,
>>> +                                   struct net *net,
>>> +                                   enum fib_event_type event_type,
>>> +                                   struct vif_device *vif,
>>> +                                   vifi_t vif_index, u32 tb_id)
>>> +{
>>> +   struct vif_entry_notifier_info info = {
>>> +           .info = {
>>> +                   .family = RTNL_FAMILY_IPMR,
>>> +                   .net = net,
>>> +           },
>>> +           .dev = vif->dev,
>>> +           .vif_index = vif_index,
>>> +           .vif_flags = vif->flags,
>>> +           .tb_id = tb_id,
>>> +   };
>> We only use info.info which is fib_notifier_info, the
>> vif_entry_notifier_info seems to be not needed, why not just
>> use fib_notifier_info?
> 
> No, that's not true.
> 
> The driver gets the notification with a pointer to a fib_notifier_info struct,
> and according to the type field uses container_of to get to the parent struct,
> which in this case is vif_entry_notifier_info. All the fields here are needed.
> You can see this code in patch 10.
> 
> By the way, this function is completely symmetric to the fib4 (which is in
> fib_trie.c +88) and fib6 (which is in ip6_fib.c +336) notify functions, which
> use the exact same process.

Thanks for clarifying. I am not familiar with ipmr, so I was only checking
coding style.


> 
>>
>>> +
>>> +   return call_fib_notifier(nb, net, event_type, &info.info);
>>> +}
>>> +
>>> +static int call_ipmr_mfc_entry_notifier(struct notifier_block *nb,
>>> +                                   struct net *net,
>>> +                                   enum fib_event_type event_type,
>>> +                                   struct mfc_cache *mfc, u32 tb_id)
>>> +{
>>> +   struct mfc_entry_notifier_info info = {
>>> +           .info = {
>>> +                   .family = RTNL_FAMILY_IPMR,
>>> +                   .net = net,
>>> +           },
>>> +           .mfc = mfc,
>>> +           .tb_id = tb_id
>>> +   };
>>> +
>> As above.
> 
> 
> As above.
> 
> 
>>
>>> +   return call_fib_notifier(nb, net, event_type, &info.info);
>>> +}
>>> +
>>>  /**
>>>   * vif_delete - Delete a VIF entry
>>>   * @notify: Set to 1, if the caller is a notifier_call
>>> @@ -3050,14 +3107,87 @@ static const struct net_protocol pim_protocol = {
>>>  };
>>>  #endif
>>>  
>>> +static unsigned int ipmr_seq_read(struct net *net)
>>> +{
>>> +   ASSERT_RTNL();
>>> +
>>> +   return net->ipv4.ipmr_seq + ipmr_rules_seq_read(net);
>>> +}
>>> +
>>> +static int ipmr_dump(struct net *net, struct notifier_block *nb)
>>> +{
>>> +   struct mr_table *mrt;
>>> +   int err;
>>> +
>>> +   err = ipmr_rules_dump(net, nb);
>>> +   if (err)
>>> +           return err;
>>> +
>>> +   ipmr_for_each_table(mrt, net) {
>>> +           struct vif_device *v = &mrt->vif_table[0];
>>> +           struct mfc_cache *mfc;
>>> +           int vifi;
>>> +
>>> +           /* Notify on table VIF entries */
>>> +           read_lock(&mrt_lock);
>>> +           for (vifi = 0; vifi < mrt->maxvif; vifi++, v++) {
>>> +                   if (!v->dev)
>>> +                           continue;
>>> +
>>> +                   call_ipmr_vif_entry_notifier(nb, net, FIB_EVENT_VIF_ADD,
>>> +                                                v, vifi, mrt->id);
>>> +           }
>>> +           read_unlock(&mrt_lock);
>>> +
>>> +           /* Notify on table MFC entries */
>>> +           list_for_each_entry_rcu(mfc, &mrt->mfc_cache_list, list)
>>> +                   call_ipmr_mfc_entry_notifier(nb, net,
>>> +                                                FIB_EVENT_ENTRY_ADD, mfc,
>>> +                                                mrt->id);
>>> +   }
>>> +
>>> +   return 0;
>>> +}
>>> +
>>> +static const struct fib_notifier_ops ipmr_notifier_ops_template = {
>>> +   .family         = RTNL_FAMILY_IPMR,
>>> +   .fib_seq_read   = ipmr_seq_read,
>>> +   .fib_dump       = ipmr_dump,
>>> +   .owner          = THIS_MODULE,
>>> +};
>>> +
>>> +int __net_init ipmr_notifier_init(struct net *net)
>>> +{
>>> +   struct fib_notifier_ops *ops;
>>> +
>>> +   net->ipv4.ipmr_seq = 0;
>>> +
>>> +   ops = fib_notifier_ops_register(&ipmr_notifier_ops_template, net);
>>> +   if (IS_ERR(ops))
>>> +           return PTR_ERR(ops);
>>> +   net->ipv4.ipmr_notifier_ops = ops;
>>> +
>>> +   return 0;
>>> +}
>>> +
>>> +static void __net_exit ipmr_notifier_exit(struct net *net)
>>> +{
>>> +   fib_notifier_ops_unregister(net->ipv4.ipmr_notifier_ops);
>>> +   net->ipv4.ipmr_notifier_ops = NULL;
>>> +}
>>> +
>>>  /* Setup for IP multicast routing */
>>>  static int __net_init ipmr_net_init(struct net *net)
>>>  {
>>>     int err;
>>>  
>>> +   err = ipmr_notifier_init(net);
>>> +   if (err)
>>> +           goto ipmr_notifier_fail;
>>> +
>>>     err = ipmr_rules_init(net);
>>>     if (err < 0)
>>> -           goto fail;
>>> +           goto ipmr_rules_fail;
>>>  
>>>  #ifdef CONFIG_PROC_FS
>>>     err = -ENOMEM;
>>> @@ -3074,7 +3204,9 @@ static int __net_init ipmr_net_init(struct net *net)
>>>  proc_vif_fail:
>>>     ipmr_rules_exit(net);
>>>  #endif
>>> -fail:
>>> +ipmr_rules_fail:
>>> +   ipmr_notifier_exit(net);
>>> +ipmr_notifier_fail:
>>>     return err;
>>>  }
>>>  
>>> @@ -3084,6 +3216,7 @@ static void __net_exit ipmr_net_exit(struct net *net)
>>>     remove_proc_entry("ip_mr_cache", net->proc_net);
>>>     remove_proc_entry("ip_mr_vif", net->proc_net);
>>>  #endif
>>> +   ipmr_notifier_exit(net);
>>>     ipmr_rules_exit(net);
>>>  }
>>>  
>>>
> 
> 
> .
> 

Reply via email to